Speedsy's picture
Upload folder using huggingface_hub
71e96ad verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.613784886449796,
"eval_steps": 500,
"global_step": 17000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0036104993320576237,
"grad_norm": 0.3989824056625366,
"learning_rate": 2.989168502003827e-05,
"loss": 0.0649,
"step": 100
},
{
"epoch": 0.007220998664115247,
"grad_norm": 0.3881397247314453,
"learning_rate": 2.9783370040076542e-05,
"loss": 0.0559,
"step": 200
},
{
"epoch": 0.01083149799617287,
"grad_norm": 0.44458580017089844,
"learning_rate": 2.9675055060114813e-05,
"loss": 0.0518,
"step": 300
},
{
"epoch": 0.014441997328230495,
"grad_norm": 0.30548182129859924,
"learning_rate": 2.9566740080153087e-05,
"loss": 0.051,
"step": 400
},
{
"epoch": 0.018052496660288117,
"grad_norm": 0.32849565148353577,
"learning_rate": 2.9458425100191357e-05,
"loss": 0.0492,
"step": 500
},
{
"epoch": 0.018052496660288117,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5399999999999999,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8333333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.68,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7433333333333333,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.46630480328833107,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6280939153439153,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5443844595515648,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5399999999999999,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.18433333333333332,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3333333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.26199999999999996,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.2676968266290956,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.5823563933514796,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.41831478280269363,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.48481025220537144,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.78,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.88,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.94,
"eval_NanoDBPedia_MaxSim_map@100": 0.4962052617439761,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8453888888888891,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6421320573979945,
"eval_NanoDBPedia_MaxSim_precision@1": 0.78,
"eval_NanoDBPedia_MaxSim_precision@10": 0.526,
"eval_NanoDBPedia_MaxSim_precision@3": 0.5933333333333333,
"eval_NanoDBPedia_MaxSim_precision@5": 0.5879999999999999,
"eval_NanoDBPedia_MaxSim_recall@1": 0.10310159469520844,
"eval_NanoDBPedia_MaxSim_recall@10": 0.36226534423586193,
"eval_NanoDBPedia_MaxSim_recall@3": 0.16970615713362208,
"eval_NanoDBPedia_MaxSim_recall@5": 0.23326627513699055,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.32,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.46,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.6,
"eval_NanoFiQA2018_MaxSim_map@100": 0.29537856332227364,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.43324603174603177,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.3807739490615844,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.32,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.11599999999999999,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.22,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.18799999999999997,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.1334126984126984,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5222063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.283515873015873,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.4099285714285714,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.92,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 0.98,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7329984056856411,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.95,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.7993054682490036,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.92,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16199999999999995,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5066666666666666,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.308,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.46,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.81,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.76,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.77,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.4,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.76,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.54,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.62,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5046595651672464,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.49404761904761907,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.556538472242046,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.4,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.07600000000000001,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.18,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.12400000000000003,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.4,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.76,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.54,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.62,
"eval_NanoNQ_MaxSim_accuracy@1": 0.44,
"eval_NanoNQ_MaxSim_accuracy@10": 0.78,
"eval_NanoNQ_MaxSim_accuracy@3": 0.58,
"eval_NanoNQ_MaxSim_accuracy@5": 0.66,
"eval_NanoNQ_MaxSim_map@100": 0.5385312151298993,
"eval_NanoNQ_MaxSim_mrr@10": 0.5382142857142856,
"eval_NanoNQ_MaxSim_ndcg@10": 0.5825753769583893,
"eval_NanoNQ_MaxSim_precision@1": 0.44,
"eval_NanoNQ_MaxSim_precision@10": 0.08,
"eval_NanoNQ_MaxSim_precision@3": 0.2,
"eval_NanoNQ_MaxSim_precision@5": 0.136,
"eval_NanoNQ_MaxSim_recall@1": 0.43,
"eval_NanoNQ_MaxSim_recall@10": 0.74,
"eval_NanoNQ_MaxSim_recall@3": 0.57,
"eval_NanoNQ_MaxSim_recall@5": 0.64,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.38,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.74,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.64,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.23005580868095027,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5076666666666666,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3049814334003711,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.38,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.14600000000000002,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.3,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.228,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.07966666666666668,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.2996666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.18666666666666668,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.23566666666666666,
"eval_runtime": 35.0429,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 500
},
{
"epoch": 0.02166299599234574,
"grad_norm": 0.21628977358341217,
"learning_rate": 2.9350110120229628e-05,
"loss": 0.0467,
"step": 600
},
{
"epoch": 0.025273495324403365,
"grad_norm": 0.2205166220664978,
"learning_rate": 2.92417951402679e-05,
"loss": 0.0451,
"step": 700
},
{
"epoch": 0.02888399465646099,
"grad_norm": 0.19837689399719238,
"learning_rate": 2.9133480160306173e-05,
"loss": 0.0443,
"step": 800
},
{
"epoch": 0.032494493988518613,
"grad_norm": 0.334910124540329,
"learning_rate": 2.9025165180344443e-05,
"loss": 0.0443,
"step": 900
},
{
"epoch": 0.036104993320576234,
"grad_norm": 0.3222765624523163,
"learning_rate": 2.8916850200382714e-05,
"loss": 0.0437,
"step": 1000
},
{
"epoch": 0.036104993320576234,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5233333333333333,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8366666666666666,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7000000000000001,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7533333333333334,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.47257389610967415,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6275939153439153,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.552169138032717,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5233333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.18833333333333335,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3433333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.26733333333333337,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.2644851334278292,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.591053878834391,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4329692968285171,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.4986754709026564,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.68,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.88,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.94,
"eval_NanoDBPedia_MaxSim_map@100": 0.49788019464343897,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.7997222222222223,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6449100757034537,
"eval_NanoDBPedia_MaxSim_precision@1": 0.68,
"eval_NanoDBPedia_MaxSim_precision@10": 0.534,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6266666666666667,
"eval_NanoDBPedia_MaxSim_precision@5": 0.604,
"eval_NanoDBPedia_MaxSim_recall@1": 0.10083143548761012,
"eval_NanoDBPedia_MaxSim_recall@10": 0.36378359046666303,
"eval_NanoDBPedia_MaxSim_recall@3": 0.1634110190663407,
"eval_NanoDBPedia_MaxSim_recall@5": 0.24312425398736712,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.32,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.7,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.5,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.58,
"eval_NanoFiQA2018_MaxSim_map@100": 0.32391779697745937,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.4390714285714285,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.40152050782871407,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.32,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.122,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.23999999999999996,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.184,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.16341269841269843,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5288730158730159,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.31573809523809526,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.4032619047619047,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7316378747088335,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9406666666666668,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8003043262414425,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16399999999999998,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.4933333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.316,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.82,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.74,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.79,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.34,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.78,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.56,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.62,
"eval_NanoMSMARCO_MaxSim_map@100": 0.48032731239273224,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.4707222222222221,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.5437155651671424,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.34,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.07800000000000001,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.18666666666666668,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.12400000000000003,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.34,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.78,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.56,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.62,
"eval_NanoNQ_MaxSim_accuracy@1": 0.46,
"eval_NanoNQ_MaxSim_accuracy@10": 0.8,
"eval_NanoNQ_MaxSim_accuracy@3": 0.66,
"eval_NanoNQ_MaxSim_accuracy@5": 0.72,
"eval_NanoNQ_MaxSim_map@100": 0.5654113147365755,
"eval_NanoNQ_MaxSim_mrr@10": 0.5727142857142856,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6091517292060955,
"eval_NanoNQ_MaxSim_precision@1": 0.46,
"eval_NanoNQ_MaxSim_precision@10": 0.084,
"eval_NanoNQ_MaxSim_precision@3": 0.22666666666666668,
"eval_NanoNQ_MaxSim_precision@5": 0.14800000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.44,
"eval_NanoNQ_MaxSim_recall@10": 0.75,
"eval_NanoNQ_MaxSim_recall@3": 0.64,
"eval_NanoNQ_MaxSim_recall@5": 0.7,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.44,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.76,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.23626888319900533,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5426666666666666,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3134126240494545,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.44,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.14800000000000002,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.228,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.09266666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.3036666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2356666666666667,
"eval_runtime": 34.4077,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 1000
},
{
"epoch": 0.03971549265263386,
"grad_norm": 0.25178298354148865,
"learning_rate": 2.8808535220420985e-05,
"loss": 0.0433,
"step": 1100
},
{
"epoch": 0.04332599198469148,
"grad_norm": 0.23704570531845093,
"learning_rate": 2.870022024045926e-05,
"loss": 0.0427,
"step": 1200
},
{
"epoch": 0.0469364913167491,
"grad_norm": 0.23128622770309448,
"learning_rate": 2.8591905260497526e-05,
"loss": 0.0414,
"step": 1300
},
{
"epoch": 0.05054699064880673,
"grad_norm": 0.17750941216945648,
"learning_rate": 2.84835902805358e-05,
"loss": 0.0417,
"step": 1400
},
{
"epoch": 0.05415748998086435,
"grad_norm": 0.3663330376148224,
"learning_rate": 2.837527530057407e-05,
"loss": 0.0418,
"step": 1500
},
{
"epoch": 0.05415748998086435,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5633333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.85,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.71,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7599999999999999,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.4913983960924009,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6536931216931218,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5686178434388155,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5633333333333334,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.18800000000000003,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3522222222222222,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.26800000000000007,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.2907379689868088,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.5971262382169605,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4433136349616484,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.49914734690231016,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.76,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.9,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.92,
"eval_NanoDBPedia_MaxSim_map@100": 0.49357562546287,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8385238095238096,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6412381208162751,
"eval_NanoDBPedia_MaxSim_precision@1": 0.76,
"eval_NanoDBPedia_MaxSim_precision@10": 0.522,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6466666666666666,
"eval_NanoDBPedia_MaxSim_precision@5": 0.6040000000000001,
"eval_NanoDBPedia_MaxSim_recall@1": 0.10234844884148789,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3512733023176364,
"eval_NanoDBPedia_MaxSim_recall@3": 0.1724770478651281,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2358126528424326,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.38,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.7,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.56,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.62,
"eval_NanoFiQA2018_MaxSim_map@100": 0.3604708658995097,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.4838333333333334,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.42851478706284807,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.38,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.12,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.26,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.188,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.20941269841269838,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5218174603174603,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.3597380952380952,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.42440476190476184,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7473907921355676,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9416666666666665,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8154442539644547,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16799999999999998,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.316,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.84,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.79,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.44,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.54,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.6,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5290379999331613,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5225,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.5865640509428862,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.44,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.18,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.12000000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.44,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.54,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.6,
"eval_NanoNQ_MaxSim_accuracy@1": 0.46,
"eval_NanoNQ_MaxSim_accuracy@10": 0.8,
"eval_NanoNQ_MaxSim_accuracy@3": 0.66,
"eval_NanoNQ_MaxSim_accuracy@5": 0.74,
"eval_NanoNQ_MaxSim_map@100": 0.5811169116483572,
"eval_NanoNQ_MaxSim_mrr@10": 0.5818888888888889,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6180803657604871,
"eval_NanoNQ_MaxSim_precision@1": 0.46,
"eval_NanoNQ_MaxSim_precision@10": 0.08199999999999999,
"eval_NanoNQ_MaxSim_precision@3": 0.22666666666666668,
"eval_NanoNQ_MaxSim_precision@5": 0.15200000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.45,
"eval_NanoNQ_MaxSim_recall@10": 0.75,
"eval_NanoNQ_MaxSim_recall@3": 0.64,
"eval_NanoNQ_MaxSim_recall@5": 0.71,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.44,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.82,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.68,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.23679818147493928,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5537460317460318,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3218654820859421,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.44,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15600000000000003,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.228,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.09266666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.31966666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17766666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2346666666666667,
"eval_runtime": 34.4641,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 1500
},
{
"epoch": 0.05776798931292198,
"grad_norm": 0.4146328866481781,
"learning_rate": 2.8266960320612344e-05,
"loss": 0.0404,
"step": 1600
},
{
"epoch": 0.0613784886449796,
"grad_norm": 0.22433452308177948,
"learning_rate": 2.8158645340650612e-05,
"loss": 0.0417,
"step": 1700
},
{
"epoch": 0.06498898797703723,
"grad_norm": 0.24399086833000183,
"learning_rate": 2.8050330360688882e-05,
"loss": 0.0407,
"step": 1800
},
{
"epoch": 0.06859948730909485,
"grad_norm": 0.24582313001155853,
"learning_rate": 2.7942015380727156e-05,
"loss": 0.0398,
"step": 1900
},
{
"epoch": 0.07220998664115247,
"grad_norm": 0.21846520900726318,
"learning_rate": 2.7833700400765424e-05,
"loss": 0.0401,
"step": 2000
},
{
"epoch": 0.07220998664115247,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5733333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8366666666666668,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7000000000000001,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7600000000000001,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.4954558691252351,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.654723544973545,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5701647723533748,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5733333333333334,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.18833333333333335,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3511111111111111,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2700000000000001,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.29383428830535036,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.5944247817150053,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4407697047863623,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5074340013486869,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.8,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.88,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.92,
"eval_NanoDBPedia_MaxSim_map@100": 0.49667412657261784,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8561904761904764,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6499392947127224,
"eval_NanoDBPedia_MaxSim_precision@1": 0.8,
"eval_NanoDBPedia_MaxSim_precision@10": 0.528,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6599999999999998,
"eval_NanoDBPedia_MaxSim_precision@5": 0.6,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08492636475273711,
"eval_NanoDBPedia_MaxSim_recall@10": 0.368397896639239,
"eval_NanoDBPedia_MaxSim_recall@3": 0.17021346681341146,
"eval_NanoDBPedia_MaxSim_recall@5": 0.23345321444132755,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.4,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.68,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.56,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.62,
"eval_NanoFiQA2018_MaxSim_map@100": 0.3752386515183775,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.498,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4353890369325066,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.4,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.11800000000000001,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2533333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.2,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.2294126984126984,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5124841269841269,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.35573809523809524,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.439484126984127,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7470006604707692,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9400000000000002,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8150432922871463,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16799999999999998,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.31999999999999995,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.84,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.4,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.76,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.54,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.64,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5111944886849614,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.4993492063492062,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.5609544296282215,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.4,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.07600000000000001,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.18,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.128,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.4,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.76,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.54,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.64,
"eval_NanoNQ_MaxSim_accuracy@1": 0.52,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.66,
"eval_NanoNQ_MaxSim_accuracy@5": 0.72,
"eval_NanoNQ_MaxSim_map@100": 0.6070675662292969,
"eval_NanoNQ_MaxSim_mrr@10": 0.6093888888888889,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6445125326273604,
"eval_NanoNQ_MaxSim_precision@1": 0.52,
"eval_NanoNQ_MaxSim_precision@10": 0.086,
"eval_NanoNQ_MaxSim_precision@3": 0.22666666666666668,
"eval_NanoNQ_MaxSim_precision@5": 0.14800000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.51,
"eval_NanoNQ_MaxSim_recall@10": 0.77,
"eval_NanoNQ_MaxSim_recall@3": 0.64,
"eval_NanoNQ_MaxSim_recall@5": 0.7,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.56,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.23555972127538763,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5254126984126983,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.315150047932292,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.154,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.27333333333333326,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.22399999999999998,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.31566666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.16866666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2316666666666667,
"eval_runtime": 34.4586,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 2000
},
{
"epoch": 0.07582048597321009,
"grad_norm": 0.2242441624403,
"learning_rate": 2.7725385420803698e-05,
"loss": 0.0404,
"step": 2100
},
{
"epoch": 0.07943098530526772,
"grad_norm": 0.14130032062530518,
"learning_rate": 2.7617070440841968e-05,
"loss": 0.0395,
"step": 2200
},
{
"epoch": 0.08304148463732534,
"grad_norm": 0.23448799550533295,
"learning_rate": 2.7508755460880242e-05,
"loss": 0.0404,
"step": 2300
},
{
"epoch": 0.08665198396938296,
"grad_norm": 0.2834147810935974,
"learning_rate": 2.740044048091851e-05,
"loss": 0.0393,
"step": 2400
},
{
"epoch": 0.09026248330144059,
"grad_norm": 0.13481761515140533,
"learning_rate": 2.7292125500956784e-05,
"loss": 0.0387,
"step": 2500
},
{
"epoch": 0.09026248330144059,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5933333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.85,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7133333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7799999999999999,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5046422854002978,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6703148148148149,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5824113068582328,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5933333333333334,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.18999999999999997,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3522222222222222,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.272,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.30895273236129445,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6068976292663578,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.44512809965946304,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5114314896149518,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.78,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.86,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.94,
"eval_NanoDBPedia_MaxSim_map@100": 0.5075443159564952,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8396666666666668,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6570907214204179,
"eval_NanoDBPedia_MaxSim_precision@1": 0.78,
"eval_NanoDBPedia_MaxSim_precision@10": 0.53,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6666666666666665,
"eval_NanoDBPedia_MaxSim_precision@5": 0.612,
"eval_NanoDBPedia_MaxSim_recall@1": 0.10363702908840146,
"eval_NanoDBPedia_MaxSim_recall@10": 0.36290164861402036,
"eval_NanoDBPedia_MaxSim_recall@3": 0.175363836052016,
"eval_NanoDBPedia_MaxSim_recall@5": 0.24462862022939394,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.42,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.7,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.56,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.66,
"eval_NanoFiQA2018_MaxSim_map@100": 0.38308877064316976,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5085555555555555,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4434745809051622,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.42,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.12,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2533333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.196,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.23941269841269844,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5158174603174603,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.35573809523809524,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.4492936507936507,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.92,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7417355217035814,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9533333333333335,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.811174764214801,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.92,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16599999999999998,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.312,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.46,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.83,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.75,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.78,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.4,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.56,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.62,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5189147655302867,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5109285714285714,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.578586058618842,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.4,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.18666666666666668,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.124,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.4,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.56,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.62,
"eval_NanoNQ_MaxSim_accuracy@1": 0.56,
"eval_NanoNQ_MaxSim_accuracy@10": 0.86,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.78,
"eval_NanoNQ_MaxSim_map@100": 0.6361385398704932,
"eval_NanoNQ_MaxSim_mrr@10": 0.64115873015873,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6809268605314935,
"eval_NanoNQ_MaxSim_precision@1": 0.56,
"eval_NanoNQ_MaxSim_precision@10": 0.092,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.16,
"eval_NanoNQ_MaxSim_recall@1": 0.55,
"eval_NanoNQ_MaxSim_recall@10": 0.82,
"eval_NanoNQ_MaxSim_recall@3": 0.66,
"eval_NanoNQ_MaxSim_recall@5": 0.74,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.48,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.76,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.68,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24043179869776007,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5682460317460317,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32321485545868056,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.48,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.152,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.27333333333333326,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.22800000000000004,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.10066666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.31266666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.16966666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2346666666666667,
"eval_runtime": 34.5509,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 2500
},
{
"epoch": 0.0938729826334982,
"grad_norm": 0.3274095356464386,
"learning_rate": 2.7183810520995054e-05,
"loss": 0.0397,
"step": 2600
},
{
"epoch": 0.09748348196555584,
"grad_norm": 0.31869104504585266,
"learning_rate": 2.7075495541033328e-05,
"loss": 0.0393,
"step": 2700
},
{
"epoch": 0.10109398129761346,
"grad_norm": 0.3646252751350403,
"learning_rate": 2.6967180561071595e-05,
"loss": 0.0384,
"step": 2800
},
{
"epoch": 0.10470448062967108,
"grad_norm": 0.18200986087322235,
"learning_rate": 2.685886558110987e-05,
"loss": 0.0382,
"step": 2900
},
{
"epoch": 0.1083149799617287,
"grad_norm": 0.2341720163822174,
"learning_rate": 2.675055060114814e-05,
"loss": 0.0381,
"step": 3000
},
{
"epoch": 0.1083149799617287,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5766666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8566666666666666,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7133333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7733333333333333,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.4995422745474514,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6636216931216931,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5783086822450157,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5766666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19033333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3566666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2740000000000001,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.29629364145220355,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6097674261653939,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.44708220478636224,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5195347306312362,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.74,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.92,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.92,
"eval_NanoDBPedia_MaxSim_map@100": 0.4912491810497416,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8316666666666666,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6437064141395017,
"eval_NanoDBPedia_MaxSim_precision@1": 0.74,
"eval_NanoDBPedia_MaxSim_precision@10": 0.526,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6666666666666665,
"eval_NanoDBPedia_MaxSim_precision@5": 0.5920000000000001,
"eval_NanoDBPedia_MaxSim_recall@1": 0.083182483633856,
"eval_NanoDBPedia_MaxSim_recall@10": 0.37489820778601485,
"eval_NanoDBPedia_MaxSim_recall@3": 0.17775513348007813,
"eval_NanoDBPedia_MaxSim_recall@5": 0.23850203458106845,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.58,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.40834918283620375,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.557,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.475122180569791,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.128,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2733333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21600000000000003,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.26591269841269843,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5420396825396826,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.37307142857142855,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.48103968253968254,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.94,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 0.98,
"eval_NanoHotpotQA_MaxSim_map@100": 0.751983742319108,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.96,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8174838378035254,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.94,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16599999999999998,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.31999999999999995,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.47,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.83,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.75,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.38,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.56,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.64,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5088223622782446,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5002380952380951,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.5710609241230001,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.38,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.18666666666666668,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.128,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.38,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.56,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.64,
"eval_NanoNQ_MaxSim_accuracy@1": 0.5,
"eval_NanoNQ_MaxSim_accuracy@10": 0.84,
"eval_NanoNQ_MaxSim_accuracy@3": 0.64,
"eval_NanoNQ_MaxSim_accuracy@5": 0.72,
"eval_NanoNQ_MaxSim_map@100": 0.5920234317069705,
"eval_NanoNQ_MaxSim_mrr@10": 0.5945238095238095,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6422125337539774,
"eval_NanoNQ_MaxSim_precision@1": 0.5,
"eval_NanoNQ_MaxSim_precision@10": 0.09,
"eval_NanoNQ_MaxSim_precision@3": 0.22,
"eval_NanoNQ_MaxSim_precision@5": 0.14800000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.49,
"eval_NanoNQ_MaxSim_recall@10": 0.8,
"eval_NanoNQ_MaxSim_recall@3": 0.64,
"eval_NanoNQ_MaxSim_recall@5": 0.71,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.6,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.68,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24482574709444013,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5383015873015872,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32026620308029924,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15200000000000002,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2933333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.24,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.3116666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.18166666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.24766666666666665,
"eval_runtime": 34.3418,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 3000
},
{
"epoch": 0.11192547929378634,
"grad_norm": 0.18178269267082214,
"learning_rate": 2.664223562118641e-05,
"loss": 0.0382,
"step": 3100
},
{
"epoch": 0.11553597862584396,
"grad_norm": 0.18662074208259583,
"learning_rate": 2.653392064122468e-05,
"loss": 0.0381,
"step": 3200
},
{
"epoch": 0.11914647795790158,
"grad_norm": 0.21615353226661682,
"learning_rate": 2.6425605661262955e-05,
"loss": 0.0385,
"step": 3300
},
{
"epoch": 0.1227569772899592,
"grad_norm": 0.12675096094608307,
"learning_rate": 2.6317290681301226e-05,
"loss": 0.0374,
"step": 3400
},
{
"epoch": 0.12636747662201683,
"grad_norm": 0.19197165966033936,
"learning_rate": 2.6208975701339493e-05,
"loss": 0.0382,
"step": 3500
},
{
"epoch": 0.12636747662201683,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5766666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.85,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.73,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7766666666666665,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5072599415454521,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6686851851851853,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5855533884961566,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5766666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19266666666666665,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3544444444444444,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2706666666666667,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.2963482553881734,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6149409192580282,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4638809231176158,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5198395830033461,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.72,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.96,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.88,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.94,
"eval_NanoDBPedia_MaxSim_map@100": 0.49686617544457556,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.815,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6436666547880592,
"eval_NanoDBPedia_MaxSim_precision@1": 0.72,
"eval_NanoDBPedia_MaxSim_precision@10": 0.5319999999999999,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6133333333333333,
"eval_NanoDBPedia_MaxSim_precision@5": 0.5920000000000001,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08284350058300854,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3752724996751535,
"eval_NanoDBPedia_MaxSim_recall@3": 0.1702141101342662,
"eval_NanoDBPedia_MaxSim_recall@5": 0.23407718055975915,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.46,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.76,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.40381685563340897,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5628888888888889,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.48334160821403654,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.46,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.13399999999999998,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.20800000000000002,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.23257936507936505,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5727063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.41640476190476183,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.47329365079365077,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.92,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7646492206270432,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9506666666666668,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8282183965228874,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.92,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.17,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.32799999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.46,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.42,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.58,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.66,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5397676865733967,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5324603174603174,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.595451831623388,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.42,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.19333333333333333,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.132,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.42,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.58,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.66,
"eval_NanoNQ_MaxSim_accuracy@1": 0.5,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.72,
"eval_NanoNQ_MaxSim_map@100": 0.6019438108261126,
"eval_NanoNQ_MaxSim_mrr@10": 0.6024047619047619,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6435942189637756,
"eval_NanoNQ_MaxSim_precision@1": 0.5,
"eval_NanoNQ_MaxSim_precision@10": 0.088,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.14800000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.49,
"eval_NanoNQ_MaxSim_recall@10": 0.78,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.71,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.44,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.76,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.64,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.23651590016817553,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5486904761904762,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3190476208647928,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.44,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.152,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.21600000000000003,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.09266666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.3116666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17666666666666664,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.22166666666666665,
"eval_runtime": 34.4054,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 3500
},
{
"epoch": 0.12997797595407445,
"grad_norm": 0.15763667225837708,
"learning_rate": 2.6100660721377767e-05,
"loss": 0.0365,
"step": 3600
},
{
"epoch": 0.13358847528613207,
"grad_norm": 0.22269487380981445,
"learning_rate": 2.5992345741416038e-05,
"loss": 0.0379,
"step": 3700
},
{
"epoch": 0.1371989746181897,
"grad_norm": 0.2786358892917633,
"learning_rate": 2.588403076145431e-05,
"loss": 0.0376,
"step": 3800
},
{
"epoch": 0.14080947395024732,
"grad_norm": 0.23443731665611267,
"learning_rate": 2.577571578149258e-05,
"loss": 0.0376,
"step": 3900
},
{
"epoch": 0.14441997328230494,
"grad_norm": 0.29361817240715027,
"learning_rate": 2.5667400801530853e-05,
"loss": 0.0378,
"step": 4000
},
{
"epoch": 0.14441997328230494,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.58,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.86,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.73,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7866666666666666,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5125269797291013,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6723373015873015,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5873604155199881,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.58,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19166666666666665,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3566666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2720000000000001,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3029078605664226,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6136794506318378,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4603223943602566,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5258254401578354,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.74,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.9,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.5039313030504377,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8310555555555557,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6510528681399917,
"eval_NanoDBPedia_MaxSim_precision@1": 0.74,
"eval_NanoDBPedia_MaxSim_precision@10": 0.534,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6333333333333333,
"eval_NanoDBPedia_MaxSim_precision@5": 0.5880000000000001,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08286779831917068,
"eval_NanoDBPedia_MaxSim_recall@10": 0.395703687918011,
"eval_NanoDBPedia_MaxSim_recall@3": 0.17486293759011126,
"eval_NanoDBPedia_MaxSim_recall@5": 0.24699232348669453,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.44,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.76,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.72,
"eval_NanoFiQA2018_MaxSim_map@100": 0.39860499362884094,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5501111111111111,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.47601434186923597,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.44,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.132,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2866666666666667,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.212,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.22591269841269843,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5677063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.41640476190476183,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.49329365079365073,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7535915228893489,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9466666666666668,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8150800264845377,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16599999999999998,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.324,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.83,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.81,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.38,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.56,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.66,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5204645932391834,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5119603174603174,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.5805837713331857,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.38,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.18666666666666668,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.132,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.38,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.56,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.66,
"eval_NanoNQ_MaxSim_accuracy@1": 0.6,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.66,
"eval_NanoNQ_MaxSim_accuracy@5": 0.72,
"eval_NanoNQ_MaxSim_map@100": 0.6617670654772172,
"eval_NanoNQ_MaxSim_mrr@10": 0.6583571428571429,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6874242628170635,
"eval_NanoNQ_MaxSim_precision@1": 0.6,
"eval_NanoNQ_MaxSim_precision@10": 0.088,
"eval_NanoNQ_MaxSim_precision@3": 0.22666666666666668,
"eval_NanoNQ_MaxSim_precision@5": 0.14800000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.59,
"eval_NanoNQ_MaxSim_recall@10": 0.78,
"eval_NanoNQ_MaxSim_recall@3": 0.66,
"eval_NanoNQ_MaxSim_recall@5": 0.71,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.2368024000895803,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5358730158730158,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3140072224759142,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.22800000000000004,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.30866666666666664,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.18066666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2346666666666667,
"eval_runtime": 34.455,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 4000
},
{
"epoch": 0.14803047261436256,
"grad_norm": 0.29444053769111633,
"learning_rate": 2.5559085821569124e-05,
"loss": 0.0365,
"step": 4100
},
{
"epoch": 0.15164097194642018,
"grad_norm": 0.1578754186630249,
"learning_rate": 2.5450770841607395e-05,
"loss": 0.0362,
"step": 4200
},
{
"epoch": 0.15525147127847783,
"grad_norm": 0.19921699166297913,
"learning_rate": 2.5342455861645665e-05,
"loss": 0.0374,
"step": 4300
},
{
"epoch": 0.15886197061053545,
"grad_norm": 0.22319479286670685,
"learning_rate": 2.523414088168394e-05,
"loss": 0.0359,
"step": 4400
},
{
"epoch": 0.16247246994259307,
"grad_norm": 0.20573937892913818,
"learning_rate": 2.512582590172221e-05,
"loss": 0.0368,
"step": 4500
},
{
"epoch": 0.16247246994259307,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5866666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8533333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7266666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7866666666666667,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5147539581662183,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6747619047619048,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5880064368467515,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5866666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19166666666666668,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3533333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2720000000000001,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.31135713059464004,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.606196675938747,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.46062438585632104,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5248665741052331,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.76,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.96,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.9,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.92,
"eval_NanoDBPedia_MaxSim_map@100": 0.5096802670686674,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8311904761904763,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6530314597508345,
"eval_NanoDBPedia_MaxSim_precision@1": 0.76,
"eval_NanoDBPedia_MaxSim_precision@10": 0.536,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6333333333333333,
"eval_NanoDBPedia_MaxSim_precision@5": 0.5880000000000001,
"eval_NanoDBPedia_MaxSim_recall@1": 0.10356341848847507,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3744737064261331,
"eval_NanoDBPedia_MaxSim_recall@3": 0.16934155323316452,
"eval_NanoDBPedia_MaxSim_recall@5": 0.23523912717108084,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.4,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.74,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.6,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.66,
"eval_NanoFiQA2018_MaxSim_map@100": 0.3698827794937051,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5177460317460317,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4457635473172924,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.4,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.128,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.26666666666666666,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.196,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.19591269841269843,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5410396825396826,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.3857380952380952,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.4452936507936508,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7486485581115798,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9466666666666668,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8121871463671069,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16599999999999998,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.324,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.83,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.81,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.46,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.78,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.6,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.7,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5660062519180166,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5567222222222221,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6101093910474691,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.46,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.07800000000000001,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.2,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.46,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.78,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.6,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.7,
"eval_NanoNQ_MaxSim_accuracy@1": 0.58,
"eval_NanoNQ_MaxSim_accuracy@10": 0.84,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.74,
"eval_NanoNQ_MaxSim_map@100": 0.6567214901478464,
"eval_NanoNQ_MaxSim_mrr@10": 0.6570238095238097,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6895589099025125,
"eval_NanoNQ_MaxSim_precision@1": 0.58,
"eval_NanoNQ_MaxSim_precision@10": 0.09,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.15200000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.57,
"eval_NanoNQ_MaxSim_recall@10": 0.8,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.72,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.8,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.58,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.7,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.2375844022574939,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5392222222222222,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.31738816669529385,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.152,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2733333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23200000000000004,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.3116666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.16866666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.23866666666666667,
"eval_runtime": 34.6168,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 4500
},
{
"epoch": 0.1660829692746507,
"grad_norm": 0.23380136489868164,
"learning_rate": 2.501751092176048e-05,
"loss": 0.0356,
"step": 4600
},
{
"epoch": 0.1696934686067083,
"grad_norm": 0.21839821338653564,
"learning_rate": 2.490919594179875e-05,
"loss": 0.0364,
"step": 4700
},
{
"epoch": 0.17330396793876593,
"grad_norm": 0.23781996965408325,
"learning_rate": 2.4800880961837025e-05,
"loss": 0.0352,
"step": 4800
},
{
"epoch": 0.17691446727082355,
"grad_norm": 0.14845891296863556,
"learning_rate": 2.4692565981875292e-05,
"loss": 0.0357,
"step": 4900
},
{
"epoch": 0.18052496660288117,
"grad_norm": 0.22429068386554718,
"learning_rate": 2.4584251001913563e-05,
"loss": 0.0366,
"step": 5000
},
{
"epoch": 0.18052496660288117,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5966666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.87,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7266666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7999999999999999,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5151475129877401,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6798915343915345,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5944808012823658,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5966666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19499999999999995,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3611111111111111,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2753333333333334,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.31113213629069836,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6233046253598915,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4560954265396356,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5333331730195064,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.8,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.92,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.5041547812257818,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8608571428571429,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6610642734764984,
"eval_NanoDBPedia_MaxSim_precision@1": 0.8,
"eval_NanoDBPedia_MaxSim_precision@10": 0.5419999999999999,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6599999999999998,
"eval_NanoDBPedia_MaxSim_precision@5": 0.5920000000000001,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08554678599815835,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3824547362863331,
"eval_NanoDBPedia_MaxSim_recall@3": 0.17883446399971814,
"eval_NanoDBPedia_MaxSim_recall@5": 0.24259427621227642,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.46,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.74,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.40044132380290715,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5597142857142857,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.46798266705946273,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.46,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.126,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.20799999999999996,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.24257936507936506,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5337063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4130714285714286,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.47773809523809524,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.88,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7509885114885115,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9273333333333335,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8152245655403907,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.88,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16999999999999996,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5066666666666667,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.324,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.44,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.76,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.81,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.46,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.84,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.58,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.7,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5660245531403026,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5607777777777777,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6259576411675118,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.46,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08399999999999999,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.19333333333333333,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.46,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.84,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.58,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.7,
"eval_NanoNQ_MaxSim_accuracy@1": 0.56,
"eval_NanoNQ_MaxSim_accuracy@10": 0.84,
"eval_NanoNQ_MaxSim_accuracy@3": 0.62,
"eval_NanoNQ_MaxSim_accuracy@5": 0.76,
"eval_NanoNQ_MaxSim_map@100": 0.6286150413913572,
"eval_NanoNQ_MaxSim_mrr@10": 0.6313888888888889,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6714618916904364,
"eval_NanoNQ_MaxSim_precision@1": 0.56,
"eval_NanoNQ_MaxSim_precision@10": 0.09,
"eval_NanoNQ_MaxSim_precision@3": 0.21333333333333332,
"eval_NanoNQ_MaxSim_precision@5": 0.15600000000000003,
"eval_NanoNQ_MaxSim_recall@1": 0.55,
"eval_NanoNQ_MaxSim_recall@10": 0.81,
"eval_NanoNQ_MaxSim_recall@3": 0.62,
"eval_NanoNQ_MaxSim_recall@5": 0.73,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.82,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.68,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24066086687758026,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5392777777777777,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32519376875989486,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.158,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.3,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23200000000000004,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.32366666666666677,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.18466666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2396666666666667,
"eval_runtime": 34.3441,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 5000
},
{
"epoch": 0.1841354659349388,
"grad_norm": 0.2954254448413849,
"learning_rate": 2.4475936021951837e-05,
"loss": 0.0358,
"step": 5100
},
{
"epoch": 0.1877459652669964,
"grad_norm": 0.20363792777061462,
"learning_rate": 2.4367621041990108e-05,
"loss": 0.0366,
"step": 5200
},
{
"epoch": 0.19135646459905406,
"grad_norm": 0.13431832194328308,
"learning_rate": 2.4259306062028378e-05,
"loss": 0.0348,
"step": 5300
},
{
"epoch": 0.19496696393111168,
"grad_norm": 0.1899450272321701,
"learning_rate": 2.415099108206665e-05,
"loss": 0.036,
"step": 5400
},
{
"epoch": 0.1985774632631693,
"grad_norm": 0.17159174382686615,
"learning_rate": 2.4042676102104923e-05,
"loss": 0.0337,
"step": 5500
},
{
"epoch": 0.1985774632631693,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5833333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8666666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7333333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.79,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5157306966829615,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6749510582010583,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5942776190870221,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5833333333333334,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19566666666666666,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3611111111111111,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2760000000000001,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.30397557063413266,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.623527320516268,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4674726773081907,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5274973417938263,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.74,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.88,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.94,
"eval_NanoDBPedia_MaxSim_map@100": 0.5082355337876947,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8298333333333333,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6594663797856035,
"eval_NanoDBPedia_MaxSim_precision@1": 0.74,
"eval_NanoDBPedia_MaxSim_precision@10": 0.5459999999999999,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6466666666666667,
"eval_NanoDBPedia_MaxSim_precision@5": 0.6000000000000001,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08260739205876443,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3852909072245931,
"eval_NanoDBPedia_MaxSim_recall@3": 0.17409796861104884,
"eval_NanoDBPedia_MaxSim_recall@5": 0.23535706663597342,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.5,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.74,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.68,
"eval_NanoFiQA2018_MaxSim_map@100": 0.41822540550674125,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5748571428571428,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.48227359954022864,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.5,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.13,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.20800000000000002,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.2725793650793651,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5402063492063491,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4130714285714286,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.46996031746031747,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7517991436371655,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9416666666666668,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8162048062912852,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16799999999999998,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5066666666666666,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.324,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.84,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.76,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.81,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.44,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.84,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.62,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.68,
"eval_NanoMSMARCO_MaxSim_map@100": 0.563318847285088,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5576904761904763,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6241100939587895,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.44,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08399999999999999,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.20666666666666667,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.136,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.44,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.84,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.62,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.68,
"eval_NanoNQ_MaxSim_accuracy@1": 0.5,
"eval_NanoNQ_MaxSim_accuracy@10": 0.86,
"eval_NanoNQ_MaxSim_accuracy@3": 0.66,
"eval_NanoNQ_MaxSim_accuracy@5": 0.76,
"eval_NanoNQ_MaxSim_map@100": 0.6097475419641843,
"eval_NanoNQ_MaxSim_mrr@10": 0.6139682539682539,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6619736393765515,
"eval_NanoNQ_MaxSim_precision@1": 0.5,
"eval_NanoNQ_MaxSim_precision@10": 0.092,
"eval_NanoNQ_MaxSim_precision@3": 0.22666666666666668,
"eval_NanoNQ_MaxSim_precision@5": 0.15600000000000003,
"eval_NanoNQ_MaxSim_recall@1": 0.49,
"eval_NanoNQ_MaxSim_recall@10": 0.82,
"eval_NanoNQ_MaxSim_recall@3": 0.66,
"eval_NanoNQ_MaxSim_recall@5": 0.73,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.76,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.68,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24305770791689477,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5316904761904762,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3216371955696741,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15400000000000003,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23199999999999998,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.3156666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17766666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2396666666666667,
"eval_runtime": 34.4168,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 5500
},
{
"epoch": 0.20218796259522692,
"grad_norm": 0.16788238286972046,
"learning_rate": 2.3934361122143194e-05,
"loss": 0.0347,
"step": 5600
},
{
"epoch": 0.20579846192728454,
"grad_norm": 0.19635850191116333,
"learning_rate": 2.3826046142181464e-05,
"loss": 0.0361,
"step": 5700
},
{
"epoch": 0.20940896125934216,
"grad_norm": 0.2777642607688904,
"learning_rate": 2.3717731162219735e-05,
"loss": 0.0356,
"step": 5800
},
{
"epoch": 0.21301946059139978,
"grad_norm": 0.2335290163755417,
"learning_rate": 2.360941618225801e-05,
"loss": 0.0359,
"step": 5900
},
{
"epoch": 0.2166299599234574,
"grad_norm": 0.1892772614955902,
"learning_rate": 2.3501101202296276e-05,
"loss": 0.0359,
"step": 6000
},
{
"epoch": 0.2166299599234574,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8633333333333333,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7400000000000001,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7866666666666666,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5199972057131541,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6832962962962963,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5954413366409802,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19233333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3622222222222222,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2793333333333334,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3117124934335555,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6192721789376111,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.47061803989119627,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5286769280126661,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.8,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.9,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.92,
"eval_NanoDBPedia_MaxSim_map@100": 0.5105400814612312,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8562222222222222,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6560094017910139,
"eval_NanoDBPedia_MaxSim_precision@1": 0.8,
"eval_NanoDBPedia_MaxSim_precision@10": 0.534,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6533333333333333,
"eval_NanoDBPedia_MaxSim_precision@5": 0.608,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08569559552196787,
"eval_NanoDBPedia_MaxSim_recall@10": 0.37159339108598494,
"eval_NanoDBPedia_MaxSim_recall@3": 0.17697014410908246,
"eval_NanoDBPedia_MaxSim_recall@5": 0.23443458394901284,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.5,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.74,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.66,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.68,
"eval_NanoFiQA2018_MaxSim_map@100": 0.4226844305764079,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5793571428571428,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.48200944107759136,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.5,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.12399999999999999,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21600000000000003,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.27591269841269844,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5323730158730159,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4290714285714285,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.4839603174603175,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7456495503464544,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9383333333333335,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8121368880098485,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16799999999999998,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.324,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.84,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.75,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.81,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.48,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.86,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.62,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.66,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5847529440716855,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5813174603174602,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.645716664323037,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.48,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08599999999999998,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.20666666666666667,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.132,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.48,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.86,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.62,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.66,
"eval_NanoNQ_MaxSim_accuracy@1": 0.5,
"eval_NanoNQ_MaxSim_accuracy@10": 0.84,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.78,
"eval_NanoNQ_MaxSim_map@100": 0.6120034716420681,
"eval_NanoNQ_MaxSim_mrr@10": 0.6163571428571428,
"eval_NanoNQ_MaxSim_ndcg@10": 0.658681037680987,
"eval_NanoNQ_MaxSim_precision@1": 0.5,
"eval_NanoNQ_MaxSim_precision@10": 0.09,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.16,
"eval_NanoNQ_MaxSim_recall@1": 0.49,
"eval_NanoNQ_MaxSim_recall@10": 0.8,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.74,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.76,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.6,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.68,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24435275618107738,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5281904761904762,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3180945869634035,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.152,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23600000000000002,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.31166666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17766666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.24366666666666667,
"eval_runtime": 34.3954,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 6000
},
{
"epoch": 0.22024045925551503,
"grad_norm": 0.19319140911102295,
"learning_rate": 2.339278622233455e-05,
"loss": 0.0347,
"step": 6100
},
{
"epoch": 0.22385095858757267,
"grad_norm": 0.2135615050792694,
"learning_rate": 2.328447124237282e-05,
"loss": 0.0355,
"step": 6200
},
{
"epoch": 0.2274614579196303,
"grad_norm": 0.21347664296627045,
"learning_rate": 2.3176156262411095e-05,
"loss": 0.0356,
"step": 6300
},
{
"epoch": 0.23107195725168792,
"grad_norm": 0.2025032937526703,
"learning_rate": 2.3067841282449362e-05,
"loss": 0.0351,
"step": 6400
},
{
"epoch": 0.23468245658374554,
"grad_norm": 0.19529680907726288,
"learning_rate": 2.2959526302487636e-05,
"loss": 0.0351,
"step": 6500
},
{
"epoch": 0.23468245658374554,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6066666666666666,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8533333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.73,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7666666666666666,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.519635868856256,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6824060846560847,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5942278559970032,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6066666666666666,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19299999999999998,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.35999999999999993,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2773333333333334,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3129029696240317,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6143700524579491,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.46632017401438314,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5203639840040152,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.82,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.96,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.9,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.92,
"eval_NanoDBPedia_MaxSim_map@100": 0.5136188818828596,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8640476190476192,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6649906845842177,
"eval_NanoDBPedia_MaxSim_precision@1": 0.82,
"eval_NanoDBPedia_MaxSim_precision@10": 0.542,
"eval_NanoDBPedia_MaxSim_precision@3": 0.64,
"eval_NanoDBPedia_MaxSim_precision@5": 0.612,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08617178599815835,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3848472988746787,
"eval_NanoDBPedia_MaxSim_recall@3": 0.17218294884820298,
"eval_NanoDBPedia_MaxSim_recall@5": 0.24355691989710723,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.74,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.6,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.66,
"eval_NanoFiQA2018_MaxSim_map@100": 0.3995290488723121,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5531904761904762,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4657946077010935,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.126,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.27999999999999997,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.20800000000000002,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.2625793650793651,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5337063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.38307142857142856,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.44996031746031745,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.92,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7684294835599184,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9516666666666667,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8291004630770893,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.92,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.17,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.33199999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.46,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.83,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.44,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.62,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.66,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5601541534729045,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5537936507936508,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6166917602584153,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.44,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08199999999999999,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.20666666666666667,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.132,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.44,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.82,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.62,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.66,
"eval_NanoNQ_MaxSim_accuracy@1": 0.56,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.7,
"eval_NanoNQ_MaxSim_accuracy@5": 0.72,
"eval_NanoNQ_MaxSim_map@100": 0.6365644710355564,
"eval_NanoNQ_MaxSim_mrr@10": 0.6460238095238096,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6741931361010292,
"eval_NanoNQ_MaxSim_precision@1": 0.56,
"eval_NanoNQ_MaxSim_precision@10": 0.088,
"eval_NanoNQ_MaxSim_precision@3": 0.24,
"eval_NanoNQ_MaxSim_precision@5": 0.14800000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.54,
"eval_NanoNQ_MaxSim_recall@10": 0.79,
"eval_NanoNQ_MaxSim_recall@3": 0.68,
"eval_NanoNQ_MaxSim_recall@5": 0.7,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.58,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.64,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.23951917431398495,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5257142857142857,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3145964842601751,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.28,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23200000000000004,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.30766666666666664,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17266666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.23866666666666667,
"eval_runtime": 34.3884,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 6500
},
{
"epoch": 0.23829295591580316,
"grad_norm": 0.22127734124660492,
"learning_rate": 2.2851211322525907e-05,
"loss": 0.0361,
"step": 6600
},
{
"epoch": 0.24190345524786078,
"grad_norm": 0.2083909660577774,
"learning_rate": 2.2742896342564174e-05,
"loss": 0.0352,
"step": 6700
},
{
"epoch": 0.2455139545799184,
"grad_norm": 0.16349641978740692,
"learning_rate": 2.2634581362602448e-05,
"loss": 0.0358,
"step": 6800
},
{
"epoch": 0.24912445391197602,
"grad_norm": 0.22648359835147858,
"learning_rate": 2.252626638264072e-05,
"loss": 0.0339,
"step": 6900
},
{
"epoch": 0.25273495324403367,
"grad_norm": 0.16047881543636322,
"learning_rate": 2.2417951402678993e-05,
"loss": 0.0345,
"step": 7000
},
{
"epoch": 0.25273495324403367,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.62,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8633333333333333,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7366666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7933333333333333,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5306273434107898,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6959973544973544,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.6031286718687926,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.62,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19233333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.36333333333333334,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.28266666666666673,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.32688534141890346,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6159955384691927,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4695157007099097,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5377011799976644,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.78,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.9,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.94,
"eval_NanoDBPedia_MaxSim_map@100": 0.5135567174913014,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8512222222222223,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6600142766412922,
"eval_NanoDBPedia_MaxSim_precision@1": 0.78,
"eval_NanoDBPedia_MaxSim_precision@10": 0.538,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6533333333333333,
"eval_NanoDBPedia_MaxSim_precision@5": 0.612,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08006601676738914,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3759335482754745,
"eval_NanoDBPedia_MaxSim_recall@3": 0.18135610902136318,
"eval_NanoDBPedia_MaxSim_recall@5": 0.25058009585900265,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.74,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.6,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.68,
"eval_NanoFiQA2018_MaxSim_map@100": 0.40617291462503247,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.56,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.47003487783543435,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.12399999999999999,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.28,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21600000000000003,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.25257936507936507,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5323730158730159,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.39307142857142857,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.47396031746031747,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.96,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7810167618009427,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.98,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8412690156145733,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.96,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16999999999999996,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.32799999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.48,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.5,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.62,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.7,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5985974921283231,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.591047619047619,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6449383638398329,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.5,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08199999999999999,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.20666666666666667,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.5,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.82,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.62,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.7,
"eval_NanoNQ_MaxSim_accuracy@1": 0.58,
"eval_NanoNQ_MaxSim_accuracy@10": 0.84,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.76,
"eval_NanoNQ_MaxSim_map@100": 0.6449593212057456,
"eval_NanoNQ_MaxSim_mrr@10": 0.6551666666666667,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6862111587046233,
"eval_NanoNQ_MaxSim_precision@1": 0.58,
"eval_NanoNQ_MaxSim_precision@10": 0.09,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.15600000000000003,
"eval_NanoNQ_MaxSim_recall@1": 0.56,
"eval_NanoNQ_MaxSim_recall@10": 0.81,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.73,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.8,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.68,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.23946085321339317,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.538547619047619,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3163043385769997,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2933333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.244,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.3076666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.18266666666666664,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2516666666666667,
"eval_runtime": 34.3958,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 7000
},
{
"epoch": 0.25634545257609126,
"grad_norm": 0.1770632266998291,
"learning_rate": 2.230963642271726e-05,
"loss": 0.0347,
"step": 7100
},
{
"epoch": 0.2599559519081489,
"grad_norm": 0.1638520210981369,
"learning_rate": 2.2201321442755534e-05,
"loss": 0.0346,
"step": 7200
},
{
"epoch": 0.2635664512402065,
"grad_norm": 0.20997895300388336,
"learning_rate": 2.2093006462793805e-05,
"loss": 0.0342,
"step": 7300
},
{
"epoch": 0.26717695057226415,
"grad_norm": 0.17646686732769012,
"learning_rate": 2.198469148283208e-05,
"loss": 0.0346,
"step": 7400
},
{
"epoch": 0.27078744990432174,
"grad_norm": 0.13323235511779785,
"learning_rate": 2.1876376502870346e-05,
"loss": 0.0339,
"step": 7500
},
{
"epoch": 0.27078744990432174,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6066666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8666666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7466666666666666,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.79,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5226584558413901,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6892037037037038,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5986422942925828,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6066666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19299999999999998,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3688888888888888,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2773333333333334,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3199769482769577,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6182158926055284,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4748958274605075,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5242282364774133,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.76,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.88,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.94,
"eval_NanoDBPedia_MaxSim_map@100": 0.5051820098055176,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8422142857142858,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6582582598477363,
"eval_NanoDBPedia_MaxSim_precision@1": 0.76,
"eval_NanoDBPedia_MaxSim_precision@10": 0.5379999999999999,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6666666666666665,
"eval_NanoDBPedia_MaxSim_precision@5": 0.612,
"eval_NanoDBPedia_MaxSim_recall@1": 0.0786156579157145,
"eval_NanoDBPedia_MaxSim_recall@10": 0.39392233976015456,
"eval_NanoDBPedia_MaxSim_recall@3": 0.17730353619161643,
"eval_NanoDBPedia_MaxSim_recall@5": 0.25174243473749625,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.5,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.74,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.68,
"eval_NanoFiQA2018_MaxSim_map@100": 0.41695264283642336,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5763571428571428,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4792461388272453,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.5,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.126,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2866666666666667,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.20800000000000002,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.2725793650793651,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5337063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.41640476190476183,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.45996031746031746,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.94,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7627113617376774,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9666666666666667,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8295334400408982,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.94,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16999999999999996,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.31999999999999995,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.47,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.48,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.62,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.68,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5783186849700008,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5719365079365079,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6256876610485098,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.48,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.20666666666666667,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.136,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.48,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.62,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.68,
"eval_NanoNQ_MaxSim_accuracy@1": 0.54,
"eval_NanoNQ_MaxSim_accuracy@10": 0.86,
"eval_NanoNQ_MaxSim_accuracy@3": 0.7,
"eval_NanoNQ_MaxSim_accuracy@5": 0.74,
"eval_NanoNQ_MaxSim_map@100": 0.6309550748768139,
"eval_NanoNQ_MaxSim_mrr@10": 0.6395238095238096,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6787501217196613,
"eval_NanoNQ_MaxSim_precision@1": 0.54,
"eval_NanoNQ_MaxSim_precision@10": 0.092,
"eval_NanoNQ_MaxSim_precision@3": 0.24,
"eval_NanoNQ_MaxSim_precision@5": 0.15200000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.53,
"eval_NanoNQ_MaxSim_recall@10": 0.82,
"eval_NanoNQ_MaxSim_recall@3": 0.68,
"eval_NanoNQ_MaxSim_recall@5": 0.71,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.8,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.64,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.7,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.2418309608219084,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5385238095238095,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32037814427144545,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15200000000000002,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.3,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23600000000000002,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.31166666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.18566666666666662,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.24366666666666667,
"eval_runtime": 34.4207,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 7500
},
{
"epoch": 0.2743979492363794,
"grad_norm": 0.23983386158943176,
"learning_rate": 2.176806152290862e-05,
"loss": 0.0344,
"step": 7600
},
{
"epoch": 0.27800844856843704,
"grad_norm": 0.12345989793539047,
"learning_rate": 2.165974654294689e-05,
"loss": 0.0323,
"step": 7700
},
{
"epoch": 0.28161894790049463,
"grad_norm": 0.13744865357875824,
"learning_rate": 2.155143156298516e-05,
"loss": 0.0333,
"step": 7800
},
{
"epoch": 0.2852294472325523,
"grad_norm": 0.1692848652601242,
"learning_rate": 2.1443116583023432e-05,
"loss": 0.0334,
"step": 7900
},
{
"epoch": 0.2888399465646099,
"grad_norm": 0.2493271678686142,
"learning_rate": 2.1334801603061706e-05,
"loss": 0.0333,
"step": 8000
},
{
"epoch": 0.2888399465646099,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5966666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8633333333333333,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7266666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7866666666666666,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5223246048258647,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6819325396825398,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.597943762210317,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5966666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19399999999999998,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3633333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2813333333333334,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3132578340578435,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6219753859917169,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4642051450032922,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5282493974166109,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.76,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.9,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.94,
"eval_NanoDBPedia_MaxSim_map@100": 0.5132208600110311,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8488888888888888,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6632783331852508,
"eval_NanoDBPedia_MaxSim_precision@1": 0.76,
"eval_NanoDBPedia_MaxSim_precision@10": 0.54,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6666666666666665,
"eval_NanoDBPedia_MaxSim_precision@5": 0.6240000000000001,
"eval_NanoDBPedia_MaxSim_recall@1": 0.07830097260102918,
"eval_NanoDBPedia_MaxSim_recall@10": 0.39247930007728615,
"eval_NanoDBPedia_MaxSim_recall@3": 0.17849277478165806,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2530122575155389,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.6,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.68,
"eval_NanoFiQA2018_MaxSim_map@100": 0.40173478604200724,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.558047619047619,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.46595736309174673,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.12399999999999999,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2733333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21200000000000002,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.25257936507936507,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5297063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.3790714285714285,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.46281746031746024,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7651761099524258,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9416666666666668,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.825720921328443,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16999999999999996,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.52,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.32799999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.78,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.46,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.6,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.68,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5698824389845417,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5648571428571428,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6251385797289163,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.46,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08199999999999999,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.2,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.136,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.46,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.82,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.6,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.68,
"eval_NanoNQ_MaxSim_accuracy@1": 0.56,
"eval_NanoNQ_MaxSim_accuracy@10": 0.86,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.74,
"eval_NanoNQ_MaxSim_map@100": 0.6400765054528211,
"eval_NanoNQ_MaxSim_mrr@10": 0.6461349206349206,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6846808789936363,
"eval_NanoNQ_MaxSim_precision@1": 0.56,
"eval_NanoNQ_MaxSim_precision@10": 0.092,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.15200000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.55,
"eval_NanoNQ_MaxSim_recall@10": 0.82,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.71,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.6,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.68,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.2438569285123614,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5319999999999999,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32288649693390936,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.156,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23600000000000002,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.31966666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17766666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.24366666666666667,
"eval_runtime": 34.2651,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 8000
},
{
"epoch": 0.2924504458966675,
"grad_norm": 0.30358925461769104,
"learning_rate": 2.1226486623099976e-05,
"loss": 0.0337,
"step": 8100
},
{
"epoch": 0.2960609452287251,
"grad_norm": 0.1639607846736908,
"learning_rate": 2.1118171643138247e-05,
"loss": 0.0339,
"step": 8200
},
{
"epoch": 0.29967144456078276,
"grad_norm": 0.14756019413471222,
"learning_rate": 2.1009856663176518e-05,
"loss": 0.0332,
"step": 8300
},
{
"epoch": 0.30328194389284036,
"grad_norm": 0.28809478878974915,
"learning_rate": 2.090154168321479e-05,
"loss": 0.0334,
"step": 8400
},
{
"epoch": 0.306892443224898,
"grad_norm": 0.19018882513046265,
"learning_rate": 2.0793226703253062e-05,
"loss": 0.0334,
"step": 8500
},
{
"epoch": 0.306892443224898,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6033333333333333,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8566666666666668,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7266666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7799999999999999,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5181186355947971,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6816772486772488,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5943612177699357,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6033333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19499999999999998,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.35888888888888887,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.28066666666666673,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.30886450808557014,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6174975638990831,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4641236421320927,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.534215249872515,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.84,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.92,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.5200576767695506,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8886904761904764,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6744457714395792,
"eval_NanoDBPedia_MaxSim_precision@1": 0.84,
"eval_NanoDBPedia_MaxSim_precision@10": 0.5459999999999999,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6666666666666667,
"eval_NanoDBPedia_MaxSim_precision@5": 0.6320000000000001,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08694101676738913,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3966123675214827,
"eval_NanoDBPedia_MaxSim_recall@3": 0.18700375755446064,
"eval_NanoDBPedia_MaxSim_recall@5": 0.26266451510810607,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.74,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.68,
"eval_NanoFiQA2018_MaxSim_map@100": 0.4061127210556784,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5642222222222223,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4790587902440385,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.132,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2866666666666667,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21200000000000002,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.25257936507936507,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5527063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.41907142857142854,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.46996031746031747,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.96,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 0.98,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7561220990338637,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9383333333333332,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8204120223496649,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.17,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.4933333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.33199999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.74,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.83,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.46,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.6,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.72,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5640466563503979,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5559126984126983,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.61389390002846,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.46,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.2,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14400000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.46,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.6,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.72,
"eval_NanoNQ_MaxSim_accuracy@1": 0.54,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.72,
"eval_NanoNQ_MaxSim_map@100": 0.6251166458728457,
"eval_NanoNQ_MaxSim_mrr@10": 0.6333809523809524,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6653573785749974,
"eval_NanoNQ_MaxSim_precision@1": 0.54,
"eval_NanoNQ_MaxSim_precision@10": 0.08800000000000001,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.14800000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.52,
"eval_NanoNQ_MaxSim_recall@10": 0.79,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.7,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.4,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.56,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.62,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.23725601448644618,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5095238095238095,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.31299944398287366,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.4,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.154,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2733333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.21600000000000003,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08366666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.31566666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.16866666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.22266666666666665,
"eval_runtime": 34.2376,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 8500
},
{
"epoch": 0.31050294255695565,
"grad_norm": 0.2729031443595886,
"learning_rate": 2.068491172329133e-05,
"loss": 0.032,
"step": 8600
},
{
"epoch": 0.31411344188901325,
"grad_norm": 0.16484437882900238,
"learning_rate": 2.0576596743329604e-05,
"loss": 0.0342,
"step": 8700
},
{
"epoch": 0.3177239412210709,
"grad_norm": 0.15732982754707336,
"learning_rate": 2.0468281763367874e-05,
"loss": 0.0337,
"step": 8800
},
{
"epoch": 0.3213344405531285,
"grad_norm": 0.1904761791229248,
"learning_rate": 2.0359966783406145e-05,
"loss": 0.0343,
"step": 8900
},
{
"epoch": 0.32494493988518613,
"grad_norm": 0.2190273404121399,
"learning_rate": 2.0251651803444416e-05,
"loss": 0.0342,
"step": 9000
},
{
"epoch": 0.32494493988518613,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6033333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8366666666666666,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.73,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7866666666666666,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5203908314922182,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6803584656084657,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.592226345148526,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6033333333333334,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19166666666666665,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.35888888888888887,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2813333333333334,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3160779583779678,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.606568827883319,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4636122120417152,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5257249634219253,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.82,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.9,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.5127080521927015,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8726666666666667,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6643252998649642,
"eval_NanoDBPedia_MaxSim_precision@1": 0.82,
"eval_NanoDBPedia_MaxSim_precision@10": 0.5399999999999999,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6466666666666667,
"eval_NanoDBPedia_MaxSim_precision@5": 0.628,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08588838518844177,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3820399514268984,
"eval_NanoDBPedia_MaxSim_recall@3": 0.18260184367886256,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2507227964045675,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.38,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.7,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.68,
"eval_NanoFiQA2018_MaxSim_map@100": 0.37265427430886094,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5028571428571429,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.43951338629226266,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.38,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.124,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.27999999999999997,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21200000000000002,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.2019126984126984,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5197063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4024047619047619,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.46996031746031747,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.92,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7699553988671636,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.955,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8270302690597099,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.92,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16799999999999998,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.32799999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.46,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.84,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.5,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.78,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.6,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.66,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5867566755201193,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5770238095238096,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6251689178697141,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.5,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.07800000000000001,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.2,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.132,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.5,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.78,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.6,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.66,
"eval_NanoNQ_MaxSim_accuracy@1": 0.58,
"eval_NanoNQ_MaxSim_accuracy@10": 0.84,
"eval_NanoNQ_MaxSim_accuracy@3": 0.66,
"eval_NanoNQ_MaxSim_accuracy@5": 0.74,
"eval_NanoNQ_MaxSim_map@100": 0.6408273631155322,
"eval_NanoNQ_MaxSim_mrr@10": 0.6507460317460318,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6827542432070257,
"eval_NanoNQ_MaxSim_precision@1": 0.58,
"eval_NanoNQ_MaxSim_precision@10": 0.09,
"eval_NanoNQ_MaxSim_precision@3": 0.22666666666666668,
"eval_NanoNQ_MaxSim_precision@5": 0.15200000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.56,
"eval_NanoNQ_MaxSim_recall@10": 0.81,
"eval_NanoNQ_MaxSim_recall@3": 0.65,
"eval_NanoNQ_MaxSim_recall@5": 0.71,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.72,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.6,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.68,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.23944322494893172,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5238571428571427,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.31456595459747977,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23600000000000002,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.30766666666666664,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17666666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.24366666666666667,
"eval_runtime": 34.3426,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 9000
},
{
"epoch": 0.3285554392172437,
"grad_norm": 0.13607436418533325,
"learning_rate": 2.014333682348269e-05,
"loss": 0.0332,
"step": 9100
},
{
"epoch": 0.3321659385493014,
"grad_norm": 0.1387406289577484,
"learning_rate": 2.003502184352096e-05,
"loss": 0.0337,
"step": 9200
},
{
"epoch": 0.33577643788135897,
"grad_norm": 0.15135791897773743,
"learning_rate": 1.992670686355923e-05,
"loss": 0.033,
"step": 9300
},
{
"epoch": 0.3393869372134166,
"grad_norm": 0.22940665483474731,
"learning_rate": 1.98183918835975e-05,
"loss": 0.0327,
"step": 9400
},
{
"epoch": 0.34299743654547427,
"grad_norm": 0.16107454895973206,
"learning_rate": 1.9710076903635775e-05,
"loss": 0.0332,
"step": 9500
},
{
"epoch": 0.34299743654547427,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6033333333333333,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.85,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7333333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.79,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.520401914943866,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.684686507936508,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.59531829229297,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6033333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19266666666666665,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3622222222222223,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2800000000000001,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3127918585129206,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6157140433157907,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.46403960711041464,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.533921827961478,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.82,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.92,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.5180071079823034,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8780555555555556,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6676156988887704,
"eval_NanoDBPedia_MaxSim_precision@1": 0.82,
"eval_NanoDBPedia_MaxSim_precision@10": 0.536,
"eval_NanoDBPedia_MaxSim_precision@3": 0.68,
"eval_NanoDBPedia_MaxSim_precision@5": 0.62,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08617178599815835,
"eval_NanoDBPedia_MaxSim_recall@10": 0.39124457735506246,
"eval_NanoDBPedia_MaxSim_recall@3": 0.18449954742439234,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2529039836418836,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.42,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.68,
"eval_NanoFiQA2018_MaxSim_map@100": 0.38687861310430877,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5315238095238095,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.45301062918338025,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.42,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.126,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2866666666666667,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21200000000000002,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.21591269841269842,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5263730158730159,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.40907142857142853,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.46996031746031747,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.94,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7746230158730159,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.97,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8400238254568488,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.94,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.172,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.52,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.33199999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.47,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.86,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.78,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.83,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.46,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.6,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.72,
"eval_NanoMSMARCO_MaxSim_map@100": 0.573822590760578,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5656904761904762,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6219875840337532,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.46,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.2,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14400000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.46,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.6,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.72,
"eval_NanoNQ_MaxSim_accuracy@1": 0.58,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.66,
"eval_NanoNQ_MaxSim_accuracy@5": 0.72,
"eval_NanoNQ_MaxSim_map@100": 0.6356945251348831,
"eval_NanoNQ_MaxSim_mrr@10": 0.6442698412698412,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6753303508208952,
"eval_NanoNQ_MaxSim_precision@1": 0.58,
"eval_NanoNQ_MaxSim_precision@10": 0.088,
"eval_NanoNQ_MaxSim_precision@3": 0.22666666666666668,
"eval_NanoNQ_MaxSim_precision@5": 0.14800000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.56,
"eval_NanoNQ_MaxSim_recall@10": 0.8,
"eval_NanoNQ_MaxSim_recall@3": 0.65,
"eval_NanoNQ_MaxSim_recall@5": 0.7,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.4,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.76,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.58,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.23338563680810664,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.518579365079365,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.31394166537417184,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.4,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.154,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.26,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.22400000000000003,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08466666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.31666666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.1606666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2306666666666667,
"eval_runtime": 34.3663,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 9500
},
{
"epoch": 0.34660793587753186,
"grad_norm": 0.16583311557769775,
"learning_rate": 1.9601761923674043e-05,
"loss": 0.0315,
"step": 9600
},
{
"epoch": 0.3502184352095895,
"grad_norm": 0.13860023021697998,
"learning_rate": 1.9493446943712317e-05,
"loss": 0.033,
"step": 9700
},
{
"epoch": 0.3538289345416471,
"grad_norm": 0.24512599408626556,
"learning_rate": 1.9385131963750587e-05,
"loss": 0.0331,
"step": 9800
},
{
"epoch": 0.35743943387370475,
"grad_norm": 0.2128891497850418,
"learning_rate": 1.927681698378886e-05,
"loss": 0.0341,
"step": 9900
},
{
"epoch": 0.36104993320576234,
"grad_norm": 0.26154008507728577,
"learning_rate": 1.916850200382713e-05,
"loss": 0.0327,
"step": 10000
},
{
"epoch": 0.36104993320576234,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6066666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.86,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7466666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7866666666666666,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5255476485937999,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6916137566137565,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.6018401416604545,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6066666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19399999999999998,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3666666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.28066666666666673,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3196467229467324,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6235398686461339,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.47123321613297103,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.530974822319108,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.78,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.92,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.516965398473738,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8620000000000002,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6601551175464997,
"eval_NanoDBPedia_MaxSim_precision@1": 0.78,
"eval_NanoDBPedia_MaxSim_precision@10": 0.53,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6733333333333335,
"eval_NanoDBPedia_MaxSim_precision@5": 0.628,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08330097260102919,
"eval_NanoDBPedia_MaxSim_recall@10": 0.38486619600378735,
"eval_NanoDBPedia_MaxSim_recall@3": 0.18766120155973073,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2662219497876635,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.74,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.66,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.68,
"eval_NanoFiQA2018_MaxSim_map@100": 0.4172825066995227,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5680238095238095,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.48866344422255087,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.13399999999999998,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21200000000000002,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.26591269841269843,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5627063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4290714285714285,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.46996031746031747,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.92,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7610749877663676,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.96,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8307941746748153,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.92,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.172,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5066666666666667,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.324,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.46,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.86,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.76,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.81,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.46,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.6,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.7,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5731172391763724,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5666111111111111,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6267492047911154,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.46,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08199999999999999,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.2,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.46,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.82,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.6,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.7,
"eval_NanoNQ_MaxSim_accuracy@1": 0.58,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.72,
"eval_NanoNQ_MaxSim_map@100": 0.6446898521667311,
"eval_NanoNQ_MaxSim_mrr@10": 0.6536031746031745,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6806198090961569,
"eval_NanoNQ_MaxSim_precision@1": 0.58,
"eval_NanoNQ_MaxSim_precision@10": 0.08800000000000001,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.14800000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.56,
"eval_NanoNQ_MaxSim_recall@10": 0.79,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.7,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24015590728006772,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5394444444444444,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32405909963158885,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.158,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23200000000000004,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.32366666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.18066666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2396666666666667,
"eval_runtime": 34.4193,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 10000
},
{
"epoch": 0.36466043253782,
"grad_norm": 0.17224304378032684,
"learning_rate": 1.90601870238654e-05,
"loss": 0.0338,
"step": 10100
},
{
"epoch": 0.3682709318698776,
"grad_norm": 0.1621134877204895,
"learning_rate": 1.8951872043903673e-05,
"loss": 0.0327,
"step": 10200
},
{
"epoch": 0.37188143120193523,
"grad_norm": 0.2112155258655548,
"learning_rate": 1.8843557063941944e-05,
"loss": 0.0325,
"step": 10300
},
{
"epoch": 0.3754919305339928,
"grad_norm": 0.16299089789390564,
"learning_rate": 1.8735242083980215e-05,
"loss": 0.0342,
"step": 10400
},
{
"epoch": 0.37910242986605047,
"grad_norm": 0.1437709629535675,
"learning_rate": 1.8626927104018485e-05,
"loss": 0.034,
"step": 10500
},
{
"epoch": 0.37910242986605047,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6066666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8466666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7600000000000001,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.8066666666666666,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5250638231683108,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6924933862433863,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5982395012957311,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6066666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19266666666666665,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.37222222222222223,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.28266666666666673,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3127275310275404,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6122499409706624,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4798036763744838,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5457031108704075,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.8,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.94,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.98,
"eval_NanoDBPedia_MaxSim_map@100": 0.5175842432474314,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8733333333333334,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6659156730406096,
"eval_NanoDBPedia_MaxSim_precision@1": 0.8,
"eval_NanoDBPedia_MaxSim_precision@10": 0.538,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6733333333333333,
"eval_NanoDBPedia_MaxSim_precision@5": 0.628,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08511915441921099,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3881266299509582,
"eval_NanoDBPedia_MaxSim_recall@3": 0.19008396300880792,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2718139033176826,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.46,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.66,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.4032861116510114,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5576666666666666,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4723093289251709,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.46,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.128,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.20800000000000002,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.23257936507936505,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5447063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4290714285714285,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.4837380952380952,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.94,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7716892389366814,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.97,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8312739326520183,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.94,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.16799999999999998,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.52,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.324,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.47,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.84,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.78,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.81,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.44,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.6,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.74,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5648382275413891,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5568809523809523,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6156380894489959,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.44,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.2,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14800000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.44,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.6,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.74,
"eval_NanoNQ_MaxSim_accuracy@1": 0.58,
"eval_NanoNQ_MaxSim_accuracy@10": 0.8,
"eval_NanoNQ_MaxSim_accuracy@3": 0.7,
"eval_NanoNQ_MaxSim_accuracy@5": 0.76,
"eval_NanoNQ_MaxSim_map@100": 0.6494659160794197,
"eval_NanoNQ_MaxSim_mrr@10": 0.6558571428571429,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6802845415488143,
"eval_NanoNQ_MaxSim_precision@1": 0.58,
"eval_NanoNQ_MaxSim_precision@10": 0.086,
"eval_NanoNQ_MaxSim_precision@3": 0.24,
"eval_NanoNQ_MaxSim_precision@5": 0.15600000000000003,
"eval_NanoNQ_MaxSim_recall@1": 0.56,
"eval_NanoNQ_MaxSim_recall@10": 0.78,
"eval_NanoNQ_MaxSim_recall@3": 0.69,
"eval_NanoNQ_MaxSim_recall@5": 0.73,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.66,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24351920155393184,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5412222222222222,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32401544215877737,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.156,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.30666666666666664,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23200000000000004,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.3206666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.18966666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.23866666666666667,
"eval_runtime": 34.5819,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 10500
},
{
"epoch": 0.3827129291981081,
"grad_norm": 0.1796998232603073,
"learning_rate": 1.851861212405676e-05,
"loss": 0.0323,
"step": 10600
},
{
"epoch": 0.3863234285301657,
"grad_norm": 0.14713527262210846,
"learning_rate": 1.8410297144095026e-05,
"loss": 0.0329,
"step": 10700
},
{
"epoch": 0.38993392786222336,
"grad_norm": 0.1769598424434662,
"learning_rate": 1.83019821641333e-05,
"loss": 0.0328,
"step": 10800
},
{
"epoch": 0.39354442719428095,
"grad_norm": 0.11684510856866837,
"learning_rate": 1.819366718417157e-05,
"loss": 0.0324,
"step": 10900
},
{
"epoch": 0.3971549265263386,
"grad_norm": 0.19939596951007843,
"learning_rate": 1.8085352204209845e-05,
"loss": 0.0321,
"step": 11000
},
{
"epoch": 0.3971549265263386,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.62,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8566666666666666,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7466666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.8033333333333333,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5356165311368197,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.699994708994709,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.608198044715266,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.62,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19399999999999998,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.37222222222222223,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2873333333333334,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3290911673911768,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6198108680379454,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4780020890728965,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5438711259296438,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.78,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.92,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.5146029768032088,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8566666666666667,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.66281108755539,
"eval_NanoDBPedia_MaxSim_precision@1": 0.78,
"eval_NanoDBPedia_MaxSim_precision@10": 0.538,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6733333333333333,
"eval_NanoDBPedia_MaxSim_precision@5": 0.6360000000000001,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08330097260102919,
"eval_NanoDBPedia_MaxSim_recall@10": 0.38449219235465626,
"eval_NanoDBPedia_MaxSim_recall@3": 0.18427443919928416,
"eval_NanoDBPedia_MaxSim_recall@5": 0.261599771450879,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.5,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.74,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.42463332750768634,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5811904761904761,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.49366844731475434,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.5,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.132,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2866666666666667,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21600000000000003,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.2625793650793651,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5587063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.41907142857142854,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.4899603174603175,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.92,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7743426768793641,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.96,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8340107971289106,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.92,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.17,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.52,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.33199999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.46,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.78,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.83,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.48,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.62,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.72,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5854672734672735,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5803333333333334,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6373427054101277,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.48,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08199999999999999,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.20666666666666667,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14400000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.48,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.82,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.62,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.72,
"eval_NanoNQ_MaxSim_accuracy@1": 0.62,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.74,
"eval_NanoNQ_MaxSim_map@100": 0.6648529754489415,
"eval_NanoNQ_MaxSim_mrr@10": 0.6735555555555556,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6945403453754027,
"eval_NanoNQ_MaxSim_precision@1": 0.62,
"eval_NanoNQ_MaxSim_precision@10": 0.08800000000000001,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.15200000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.6,
"eval_NanoNQ_MaxSim_recall@10": 0.79,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.71,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.7,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24979995671444383,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5482222222222223,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3268148855070103,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.154,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.3133333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.244,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.31566666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.19466666666666668,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2516666666666667,
"eval_runtime": 34.4482,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 11000
},
{
"epoch": 0.4007654258583962,
"grad_norm": 0.11463096737861633,
"learning_rate": 1.7977037224248112e-05,
"loss": 0.0329,
"step": 11100
},
{
"epoch": 0.40437592519045384,
"grad_norm": 0.20800238847732544,
"learning_rate": 1.7868722244286386e-05,
"loss": 0.0329,
"step": 11200
},
{
"epoch": 0.40798642452251144,
"grad_norm": 0.17940069735050201,
"learning_rate": 1.7760407264324657e-05,
"loss": 0.0325,
"step": 11300
},
{
"epoch": 0.4115969238545691,
"grad_norm": 0.1161593496799469,
"learning_rate": 1.7652092284362928e-05,
"loss": 0.0321,
"step": 11400
},
{
"epoch": 0.41520742318662673,
"grad_norm": 0.19153328239917755,
"learning_rate": 1.75437773044012e-05,
"loss": 0.0325,
"step": 11500
},
{
"epoch": 0.41520742318662673,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6033333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8533333333333332,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.75,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.8066666666666665,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5270053340816997,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.690882275132275,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.600155555164153,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6033333333333334,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19233333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3711111111111111,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2813333333333334,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.31492450072451017,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6172971426329156,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.47876976584057335,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5396278056138751,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.76,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.94,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.98,
"eval_NanoDBPedia_MaxSim_map@100": 0.5169174144063625,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.86,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6616949369165016,
"eval_NanoDBPedia_MaxSim_precision@1": 0.76,
"eval_NanoDBPedia_MaxSim_precision@10": 0.534,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6866666666666665,
"eval_NanoDBPedia_MaxSim_precision@5": 0.624,
"eval_NanoDBPedia_MaxSim_recall@1": 0.07830097260102918,
"eval_NanoDBPedia_MaxSim_recall@10": 0.38640983992447775,
"eval_NanoDBPedia_MaxSim_recall@3": 0.19588049980534475,
"eval_NanoDBPedia_MaxSim_recall@5": 0.26213984955626657,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.46,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.66,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.4045624909068759,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5585238095238094,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.46983646425668213,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.46,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.12599999999999997,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21200000000000002,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.23257936507936505,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5357063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4290714285714285,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.4859603174603174,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.94,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7803834289605401,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.97,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8418884574544292,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.94,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.172,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.52,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.32,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.47,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.86,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.78,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.46,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.62,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.72,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5732583547734661,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5671666666666667,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6230783125516643,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.46,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.20666666666666667,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14400000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.46,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.62,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.72,
"eval_NanoNQ_MaxSim_accuracy@1": 0.58,
"eval_NanoNQ_MaxSim_accuracy@10": 0.84,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.76,
"eval_NanoNQ_MaxSim_map@100": 0.6445963784178678,
"eval_NanoNQ_MaxSim_mrr@10": 0.6545793650793651,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6852992294819955,
"eval_NanoNQ_MaxSim_precision@1": 0.58,
"eval_NanoNQ_MaxSim_precision@10": 0.09,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.15600000000000003,
"eval_NanoNQ_MaxSim_recall@1": 0.56,
"eval_NanoNQ_MaxSim_recall@10": 0.81,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.73,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.76,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.6,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.68,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24231393702508577,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5350238095238095,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3191359303236444,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.152,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23200000000000004,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.31166666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17766666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2396666666666667,
"eval_runtime": 34.495,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 11500
},
{
"epoch": 0.4188179225186843,
"grad_norm": 0.1335674375295639,
"learning_rate": 1.743546232443947e-05,
"loss": 0.0327,
"step": 11600
},
{
"epoch": 0.422428421850742,
"grad_norm": 0.21090449392795563,
"learning_rate": 1.7327147344477743e-05,
"loss": 0.0327,
"step": 11700
},
{
"epoch": 0.42603892118279957,
"grad_norm": 0.1386965811252594,
"learning_rate": 1.721883236451601e-05,
"loss": 0.0326,
"step": 11800
},
{
"epoch": 0.4296494205148572,
"grad_norm": 0.24617333710193634,
"learning_rate": 1.7110517384554284e-05,
"loss": 0.0329,
"step": 11900
},
{
"epoch": 0.4332599198469148,
"grad_norm": 0.1555705964565277,
"learning_rate": 1.7002202404592555e-05,
"loss": 0.0332,
"step": 12000
},
{
"epoch": 0.4332599198469148,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6133333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.85,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7566666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7966666666666667,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5282484697341063,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6964748677248677,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.6014662165364829,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6133333333333334,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19166666666666665,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.36444444444444435,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2813333333333333,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3177275310275405,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6183279471191584,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4768973071931239,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5397705479274165,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.8,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.96,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.98,
"eval_NanoDBPedia_MaxSim_map@100": 0.5173705886529766,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.875,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6558847426017816,
"eval_NanoDBPedia_MaxSim_precision@1": 0.8,
"eval_NanoDBPedia_MaxSim_precision@10": 0.5259999999999999,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6599999999999998,
"eval_NanoDBPedia_MaxSim_precision@5": 0.616,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08511915441921099,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3785946668419347,
"eval_NanoDBPedia_MaxSim_recall@3": 0.19264574792064795,
"eval_NanoDBPedia_MaxSim_recall@5": 0.26321852565973725,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.5,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.66,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.42085008579126076,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5866666666666667,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.48597991633275844,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.5,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.126,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.212,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.25257936507936507,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5407063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4290714285714285,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.49773809523809526,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.92,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7659158780361733,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9566666666666666,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8324473186545447,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.92,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.172,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.32799999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.46,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.86,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.44,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.62,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.68,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5647795499370252,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5573809523809524,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6160006672863827,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.44,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.20666666666666667,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.136,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.44,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.62,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.68,
"eval_NanoNQ_MaxSim_accuracy@1": 0.6,
"eval_NanoNQ_MaxSim_accuracy@10": 0.84,
"eval_NanoNQ_MaxSim_accuracy@3": 0.7,
"eval_NanoNQ_MaxSim_accuracy@5": 0.76,
"eval_NanoNQ_MaxSim_map@100": 0.6584798671537803,
"eval_NanoNQ_MaxSim_mrr@10": 0.6720555555555556,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6966201472186576,
"eval_NanoNQ_MaxSim_precision@1": 0.6,
"eval_NanoNQ_MaxSim_precision@10": 0.09,
"eval_NanoNQ_MaxSim_precision@3": 0.24,
"eval_NanoNQ_MaxSim_precision@5": 0.15600000000000003,
"eval_NanoNQ_MaxSim_recall@1": 0.58,
"eval_NanoNQ_MaxSim_recall@10": 0.81,
"eval_NanoNQ_MaxSim_recall@3": 0.68,
"eval_NanoNQ_MaxSim_recall@5": 0.73,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.76,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.6,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.2420948488334217,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.531079365079365,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32186450712477227,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15600000000000003,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2733333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.24000000000000005,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.32066666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.1696666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.24766666666666665,
"eval_runtime": 34.5767,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 12000
},
{
"epoch": 0.43687041917897246,
"grad_norm": 0.2230769395828247,
"learning_rate": 1.689388742463083e-05,
"loss": 0.0323,
"step": 12100
},
{
"epoch": 0.44048091851103005,
"grad_norm": 0.14988218247890472,
"learning_rate": 1.6785572444669096e-05,
"loss": 0.0327,
"step": 12200
},
{
"epoch": 0.4440914178430877,
"grad_norm": 0.16966967284679413,
"learning_rate": 1.667725746470737e-05,
"loss": 0.0321,
"step": 12300
},
{
"epoch": 0.44770191717514535,
"grad_norm": 0.17524941265583038,
"learning_rate": 1.656894248474564e-05,
"loss": 0.0321,
"step": 12400
},
{
"epoch": 0.45131241650720294,
"grad_norm": 0.14929385483264923,
"learning_rate": 1.646062750478391e-05,
"loss": 0.0319,
"step": 12500
},
{
"epoch": 0.45131241650720294,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.61,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8566666666666666,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.75,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7966666666666665,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5292465975656668,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6928637566137565,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.6042163390077616,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.61,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19466666666666665,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.36666666666666664,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.28066666666666673,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.31784647244889047,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6233098051635165,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.47727983834069737,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5391257430061328,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.8,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.94,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.98,
"eval_NanoDBPedia_MaxSim_map@100": 0.5166253435639543,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8786666666666667,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6629760349630776,
"eval_NanoDBPedia_MaxSim_precision@1": 0.8,
"eval_NanoDBPedia_MaxSim_precision@10": 0.534,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6666666666666665,
"eval_NanoDBPedia_MaxSim_precision@5": 0.616,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08583280294731091,
"eval_NanoDBPedia_MaxSim_recall@10": 0.37898581510808294,
"eval_NanoDBPedia_MaxSim_recall@3": 0.1929409348060893,
"eval_NanoDBPedia_MaxSim_recall@5": 0.26027033105267,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.5,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.4217013240748118,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5785555555555555,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4876535104260081,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.5,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.12999999999999998,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2866666666666667,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21600000000000003,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.2625793650793651,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5482063492063493,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.41907142857142854,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.48881746031746026,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 0.98,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7690877733377732,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9416666666666665,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8309969122346159,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.172,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5066666666666666,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.32799999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.86,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.76,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.42,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.64,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.72,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5607512406156985,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5559444444444445,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6197437901185515,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.42,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08199999999999999,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.21333333333333332,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14400000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.42,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.82,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.64,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.72,
"eval_NanoNQ_MaxSim_accuracy@1": 0.62,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.74,
"eval_NanoNQ_MaxSim_map@100": 0.6611965803157284,
"eval_NanoNQ_MaxSim_mrr@10": 0.6695793650793651,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6942936372669689,
"eval_NanoNQ_MaxSim_precision@1": 0.62,
"eval_NanoNQ_MaxSim_precision@10": 0.088,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.15200000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.6,
"eval_NanoNQ_MaxSim_recall@10": 0.8,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.71,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.64,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24611732348603543,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5327698412698413,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3296341490373473,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.162,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.228,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.33266666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.18166666666666664,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2356666666666667,
"eval_runtime": 34.4578,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 12500
},
{
"epoch": 0.4549229158392606,
"grad_norm": 0.16993014514446259,
"learning_rate": 1.6352312524822182e-05,
"loss": 0.0326,
"step": 12600
},
{
"epoch": 0.4585334151713182,
"grad_norm": 0.13655556738376617,
"learning_rate": 1.6243997544860456e-05,
"loss": 0.032,
"step": 12700
},
{
"epoch": 0.46214391450337583,
"grad_norm": 0.1385829746723175,
"learning_rate": 1.6135682564898727e-05,
"loss": 0.032,
"step": 12800
},
{
"epoch": 0.4657544138354334,
"grad_norm": 0.1862432211637497,
"learning_rate": 1.6027367584936997e-05,
"loss": 0.0302,
"step": 12900
},
{
"epoch": 0.46936491316749107,
"grad_norm": 0.18993531167507172,
"learning_rate": 1.5919052604975268e-05,
"loss": 0.0311,
"step": 13000
},
{
"epoch": 0.46936491316749107,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6133333333333333,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8466666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7466666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7966666666666665,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5291853935890819,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6927843915343915,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.6011754912416274,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6133333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19299999999999998,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3666666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2793333333333334,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3178557361557455,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6154327801908678,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4771065713961289,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5393938577402076,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.82,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.92,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.98,
"eval_NanoDBPedia_MaxSim_map@100": 0.5216451669898365,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8841666666666665,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6687204820040961,
"eval_NanoDBPedia_MaxSim_precision@1": 0.82,
"eval_NanoDBPedia_MaxSim_precision@10": 0.5379999999999999,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6666666666666667,
"eval_NanoDBPedia_MaxSim_precision@5": 0.612,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08588838518844177,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3887236652721905,
"eval_NanoDBPedia_MaxSim_recall@3": 0.18990133313867807,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2608790194571186,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.4045734660624793,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5621666666666666,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.472577724428551,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.128,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2866666666666667,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21600000000000003,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.24257936507936506,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5432063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.40907142857142853,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.48881746031746026,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7718414664634531,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9466666666666668,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8305152979072146,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.17,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.52,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.33199999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.78,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.83,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.44,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.64,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.72,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5673404271167428,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5608571428571429,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6190704380054695,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.44,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.21333333333333332,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14400000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.44,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.64,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.72,
"eval_NanoNQ_MaxSim_accuracy@1": 0.62,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.74,
"eval_NanoNQ_MaxSim_map@100": 0.6646388536442245,
"eval_NanoNQ_MaxSim_mrr@10": 0.6726349206349207,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6929017726893819,
"eval_NanoNQ_MaxSim_precision@1": 0.62,
"eval_NanoNQ_MaxSim_precision@10": 0.086,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.15200000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.6,
"eval_NanoNQ_MaxSim_recall@10": 0.79,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.71,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.74,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.6,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.64,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24507298125775562,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5302142857142856,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32326723241505134,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15600000000000003,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.28,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.22,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.32066666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17366666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.22666666666666666,
"eval_runtime": 34.3722,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 13000
},
{
"epoch": 0.47297541249954866,
"grad_norm": 0.20517900586128235,
"learning_rate": 1.5810737625013542e-05,
"loss": 0.0321,
"step": 13100
},
{
"epoch": 0.4765859118316063,
"grad_norm": 0.13332438468933105,
"learning_rate": 1.5702422645051813e-05,
"loss": 0.0318,
"step": 13200
},
{
"epoch": 0.48019641116366396,
"grad_norm": 0.1347808688879013,
"learning_rate": 1.559410766509008e-05,
"loss": 0.032,
"step": 13300
},
{
"epoch": 0.48380691049572155,
"grad_norm": 0.13791468739509583,
"learning_rate": 1.5485792685128354e-05,
"loss": 0.0315,
"step": 13400
},
{
"epoch": 0.4874174098277792,
"grad_norm": 0.1895150989294052,
"learning_rate": 1.5377477705166625e-05,
"loss": 0.0317,
"step": 13500
},
{
"epoch": 0.4874174098277792,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5966666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8466666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7633333333333333,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.8033333333333333,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5229389553373291,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6891031746031747,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5964219230611428,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5966666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19166666666666665,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3711111111111111,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2826666666666666,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3050999393210014,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6120765266706496,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.48052670026417443,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.538852159318658,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.78,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.94,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.5162775272612334,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.865,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6628438715724281,
"eval_NanoDBPedia_MaxSim_precision@1": 0.78,
"eval_NanoDBPedia_MaxSim_precision@10": 0.534,
"eval_NanoDBPedia_MaxSim_precision@3": 0.68,
"eval_NanoDBPedia_MaxSim_precision@5": 0.628,
"eval_NanoDBPedia_MaxSim_recall@1": 0.07935360417997654,
"eval_NanoDBPedia_MaxSim_recall@10": 0.38480836637310384,
"eval_NanoDBPedia_MaxSim_recall@3": 0.1824221063469513,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2528510511500431,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.46,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.68,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.40686537336430506,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5662222222222222,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4780733186292386,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.46,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.13,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.3,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21599999999999997,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.22257936507936507,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5499841269841269,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4490714285714285,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.49059523809523803,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.92,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7614190871572675,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9533333333333335,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8257034622935508,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.92,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.17,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5066666666666666,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.316,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.46,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.76,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.79,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.42,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.64,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.72,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5624496527732818,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5558571428571429,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6152965308068652,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.42,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.21333333333333332,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14400000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.42,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.64,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.72,
"eval_NanoNQ_MaxSim_accuracy@1": 0.58,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.78,
"eval_NanoNQ_MaxSim_map@100": 0.6480636083551373,
"eval_NanoNQ_MaxSim_mrr@10": 0.6571904761904761,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6794552484225348,
"eval_NanoNQ_MaxSim_precision@1": 0.58,
"eval_NanoNQ_MaxSim_precision@10": 0.086,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.16,
"eval_NanoNQ_MaxSim_recall@1": 0.56,
"eval_NanoNQ_MaxSim_recall@10": 0.78,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.74,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.76,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.64,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24255848311274966,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5370158730158731,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.317159106642239,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23199999999999998,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.30766666666666664,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.18166666666666664,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2396666666666667,
"eval_runtime": 34.4346,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 13500
},
{
"epoch": 0.4910279091598368,
"grad_norm": 0.42774638533592224,
"learning_rate": 1.5269162725204895e-05,
"loss": 0.0316,
"step": 13600
},
{
"epoch": 0.49463840849189444,
"grad_norm": 0.13089995086193085,
"learning_rate": 1.5160847745243168e-05,
"loss": 0.0335,
"step": 13700
},
{
"epoch": 0.49824890782395204,
"grad_norm": 0.17979566752910614,
"learning_rate": 1.505253276528144e-05,
"loss": 0.0313,
"step": 13800
},
{
"epoch": 0.5018594071560096,
"grad_norm": 0.1646861582994461,
"learning_rate": 1.494421778531971e-05,
"loss": 0.0317,
"step": 13900
},
{
"epoch": 0.5054699064880673,
"grad_norm": 0.1698364019393921,
"learning_rate": 1.4835902805357983e-05,
"loss": 0.0321,
"step": 14000
},
{
"epoch": 0.5054699064880673,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8433333333333333,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7466666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.79,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5240862726711031,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6866216931216931,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.5946487421681512,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19133333333333336,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3644444444444445,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2813333333333333,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3115911673911768,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6068815855149128,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.47320936207819214,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5352118578114539,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.76,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.9,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.5168095797800448,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8473333333333335,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6579277599171298,
"eval_NanoDBPedia_MaxSim_precision@1": 0.76,
"eval_NanoDBPedia_MaxSim_precision@10": 0.536,
"eval_NanoDBPedia_MaxSim_precision@3": 0.66,
"eval_NanoDBPedia_MaxSim_precision@5": 0.624,
"eval_NanoDBPedia_MaxSim_recall@1": 0.07830097260102918,
"eval_NanoDBPedia_MaxSim_recall@10": 0.38491649721646104,
"eval_NanoDBPedia_MaxSim_recall@3": 0.18074029945328005,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2560092421068186,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.7,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.66,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.41039166814485706,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5656666666666667,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4675693091400738,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.122,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21599999999999997,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.25257936507936507,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5107063492063493,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4268492063492063,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.49059523809523803,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.94,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7724926601186367,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.97,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8350675556593273,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.94,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.17,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5066666666666667,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.32799999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.47,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.76,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.42,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.62,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.7,
"eval_NanoMSMARCO_MaxSim_map@100": 0.555037241895581,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5475238095238096,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.608813176819059,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.42,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.20666666666666667,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.42,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.62,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.7,
"eval_NanoNQ_MaxSim_accuracy@1": 0.58,
"eval_NanoNQ_MaxSim_accuracy@10": 0.8,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.74,
"eval_NanoNQ_MaxSim_map@100": 0.6459740317063808,
"eval_NanoNQ_MaxSim_mrr@10": 0.6525238095238095,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6774086852909746,
"eval_NanoNQ_MaxSim_precision@1": 0.58,
"eval_NanoNQ_MaxSim_precision@10": 0.086,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.15200000000000002,
"eval_NanoNQ_MaxSim_recall@1": 0.56,
"eval_NanoNQ_MaxSim_recall@10": 0.78,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.71,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.64,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24381245438111843,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5366825396825396,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3211059661823423,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15400000000000003,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.228,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.31566666666666665,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.18166666666666664,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2346666666666667,
"eval_runtime": 34.3586,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 14000
},
{
"epoch": 0.5090804058201249,
"grad_norm": 0.17132635414600372,
"learning_rate": 1.4727587825396252e-05,
"loss": 0.0318,
"step": 14100
},
{
"epoch": 0.5126909051521825,
"grad_norm": 0.18724673986434937,
"learning_rate": 1.4619272845434522e-05,
"loss": 0.0328,
"step": 14200
},
{
"epoch": 0.5163014044842402,
"grad_norm": 0.17296718060970306,
"learning_rate": 1.4510957865472795e-05,
"loss": 0.0307,
"step": 14300
},
{
"epoch": 0.5199119038162978,
"grad_norm": 0.21140842139720917,
"learning_rate": 1.4402642885511065e-05,
"loss": 0.0326,
"step": 14400
},
{
"epoch": 0.5235224031483554,
"grad_norm": 0.15276139974594116,
"learning_rate": 1.4294327905549338e-05,
"loss": 0.0322,
"step": 14500
},
{
"epoch": 0.5235224031483554,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6066666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8533333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7566666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.8066666666666666,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5338979965602548,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6927301587301589,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.6040595007987866,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6066666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19299999999999998,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3744444444444444,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2833333333333334,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.32016342846343787,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6163820713888003,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4901987781862523,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5526920677882746,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.76,
"eval_NanoDBPedia_MaxSim_accuracy@10": 0.98,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.92,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.94,
"eval_NanoDBPedia_MaxSim_map@100": 0.5172632270115461,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8460000000000001,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6558120932711752,
"eval_NanoDBPedia_MaxSim_precision@1": 0.76,
"eval_NanoDBPedia_MaxSim_precision@10": 0.532,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6866666666666665,
"eval_NanoDBPedia_MaxSim_precision@5": 0.6040000000000001,
"eval_NanoDBPedia_MaxSim_recall@1": 0.07973453903459561,
"eval_NanoDBPedia_MaxSim_recall@10": 0.38391941245978556,
"eval_NanoDBPedia_MaxSim_recall@3": 0.1884545738794188,
"eval_NanoDBPedia_MaxSim_recall@5": 0.252890501967743,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.52,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.7,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.72,
"eval_NanoFiQA2018_MaxSim_map@100": 0.44623922457066234,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.605,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.5041870151434353,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.52,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.128,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.30666666666666664,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21999999999999997,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.28257936507936504,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5397063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.46907142857142853,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.510595238095238,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7735191149511956,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9466666666666668,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8344358891619182,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.172,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.52,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.33599999999999997,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.86,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.78,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.84,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.42,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.64,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.74,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5556047797541441,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5476666666666666,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6092643524667166,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.42,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.21333333333333332,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14800000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.42,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.64,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.74,
"eval_NanoNQ_MaxSim_accuracy@1": 0.62,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.7,
"eval_NanoNQ_MaxSim_accuracy@5": 0.76,
"eval_NanoNQ_MaxSim_map@100": 0.6671892599370804,
"eval_NanoNQ_MaxSim_mrr@10": 0.6747460317460318,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6962961864433254,
"eval_NanoNQ_MaxSim_precision@1": 0.62,
"eval_NanoNQ_MaxSim_precision@10": 0.08800000000000001,
"eval_NanoNQ_MaxSim_precision@3": 0.24,
"eval_NanoNQ_MaxSim_precision@5": 0.15600000000000003,
"eval_NanoNQ_MaxSim_recall@1": 0.6,
"eval_NanoNQ_MaxSim_recall@10": 0.79,
"eval_NanoNQ_MaxSim_recall@3": 0.69,
"eval_NanoNQ_MaxSim_recall@5": 0.73,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.8,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.58,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.68,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24357237313690053,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5363015873015873,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32436146830614826,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.158,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.27999999999999997,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.236,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.3246666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17366666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.24266666666666667,
"eval_runtime": 34.4468,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 14500
},
{
"epoch": 0.527132902480413,
"grad_norm": 0.15041430294513702,
"learning_rate": 1.4186012925587608e-05,
"loss": 0.0321,
"step": 14600
},
{
"epoch": 0.5307434018124707,
"grad_norm": 0.12157612293958664,
"learning_rate": 1.407769794562588e-05,
"loss": 0.0308,
"step": 14700
},
{
"epoch": 0.5343539011445283,
"grad_norm": 0.17142465710639954,
"learning_rate": 1.3969382965664151e-05,
"loss": 0.0315,
"step": 14800
},
{
"epoch": 0.5379644004765859,
"grad_norm": 0.208014577627182,
"learning_rate": 1.3861067985702424e-05,
"loss": 0.0324,
"step": 14900
},
{
"epoch": 0.5415748998086435,
"grad_norm": 0.10315755754709244,
"learning_rate": 1.3752753005740694e-05,
"loss": 0.0305,
"step": 15000
},
{
"epoch": 0.5415748998086435,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6033333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8566666666666666,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7566666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.8066666666666666,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.528898049838572,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.690600529100529,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.6021844531577661,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6033333333333334,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19366666666666665,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.37333333333333335,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.284,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.31367220039326243,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6205302102425817,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4847918536606837,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5503413234689233,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.78,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.92,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.5152786026732231,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8591666666666667,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6597974404510716,
"eval_NanoDBPedia_MaxSim_precision@1": 0.78,
"eval_NanoDBPedia_MaxSim_precision@10": 0.534,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6866666666666665,
"eval_NanoDBPedia_MaxSim_precision@5": 0.612,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08078717061354299,
"eval_NanoDBPedia_MaxSim_recall@10": 0.38619713447136306,
"eval_NanoDBPedia_MaxSim_recall@3": 0.19201302672600729,
"eval_NanoDBPedia_MaxSim_recall@5": 0.26056381382941296,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.68,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.72,
"eval_NanoFiQA2018_MaxSim_map@100": 0.4231396409519793,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5723333333333332,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.48979461142348696,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.132,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.3,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.22399999999999998,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.25257936507936507,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5563174603174602,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4490714285714285,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.5128174603174602,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.92,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7795880890244439,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.96,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8402347971226211,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.92,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.172,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.52,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.33199999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.46,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.86,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.78,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.83,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.42,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.62,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.72,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5546270755729825,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5467142857142856,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6080921371293186,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.42,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.20666666666666667,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14400000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.42,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.62,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.72,
"eval_NanoNQ_MaxSim_accuracy@1": 0.6,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.7,
"eval_NanoNQ_MaxSim_accuracy@5": 0.78,
"eval_NanoNQ_MaxSim_map@100": 0.6600318279764187,
"eval_NanoNQ_MaxSim_mrr@10": 0.6695,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6944545361799618,
"eval_NanoNQ_MaxSim_precision@1": 0.6,
"eval_NanoNQ_MaxSim_precision@10": 0.088,
"eval_NanoNQ_MaxSim_precision@3": 0.24,
"eval_NanoNQ_MaxSim_precision@5": 0.16,
"eval_NanoNQ_MaxSim_recall@1": 0.58,
"eval_NanoNQ_MaxSim_recall@10": 0.8,
"eval_NanoNQ_MaxSim_recall@3": 0.69,
"eval_NanoNQ_MaxSim_recall@5": 0.74,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.8,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.62,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24072306283238448,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5358888888888889,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32073319664013694,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.15600000000000003,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23199999999999998,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.32066666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.17766666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.23866666666666667,
"eval_runtime": 34.3717,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 15000
},
{
"epoch": 0.5451853991407012,
"grad_norm": 0.17434610426425934,
"learning_rate": 1.3644438025778967e-05,
"loss": 0.0324,
"step": 15100
},
{
"epoch": 0.5487958984727588,
"grad_norm": 0.13397444784641266,
"learning_rate": 1.3536123045817237e-05,
"loss": 0.0315,
"step": 15200
},
{
"epoch": 0.5524063978048164,
"grad_norm": 0.150449737906456,
"learning_rate": 1.3427808065855508e-05,
"loss": 0.0311,
"step": 15300
},
{
"epoch": 0.5560168971368741,
"grad_norm": 0.2947181463241577,
"learning_rate": 1.331949308589378e-05,
"loss": 0.0317,
"step": 15400
},
{
"epoch": 0.5596273964689317,
"grad_norm": 0.18219080567359924,
"learning_rate": 1.321117810593205e-05,
"loss": 0.0309,
"step": 15500
},
{
"epoch": 0.5596273964689317,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6066666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8533333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7433333333333333,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.8033333333333332,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5294326308657656,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6903148148148147,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.6013613737191356,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6066666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19299999999999995,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3644444444444444,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2813333333333333,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.31992220039326247,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.617942842921794,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4708263870115356,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5503854291174196,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.78,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.94,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.5141567253738721,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8578571428571428,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6540979805725969,
"eval_NanoDBPedia_MaxSim_precision@1": 0.78,
"eval_NanoDBPedia_MaxSim_precision@10": 0.5299999999999999,
"eval_NanoDBPedia_MaxSim_precision@3": 0.68,
"eval_NanoDBPedia_MaxSim_precision@5": 0.6,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08078717061354299,
"eval_NanoDBPedia_MaxSim_recall@10": 0.38078404165774815,
"eval_NanoDBPedia_MaxSim_recall@3": 0.19722022683111828,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2630506699426126,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.64,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.72,
"eval_NanoFiQA2018_MaxSim_map@100": 0.41254237536011445,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5656666666666667,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4769588254780853,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.128,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.2866666666666666,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21999999999999997,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.25007936507936507,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5382063492063492,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.41907142857142854,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.510595238095238,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7680798588474608,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9433333333333335,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8309120194477089,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.172,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.33599999999999997,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.86,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.84,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.46,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.6,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.72,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5753959541336626,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5677460317460317,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6234410064659702,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.46,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.2,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14400000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.46,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.6,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.72,
"eval_NanoNQ_MaxSim_accuracy@1": 0.6,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.76,
"eval_NanoNQ_MaxSim_map@100": 0.6621104682815647,
"eval_NanoNQ_MaxSim_mrr@10": 0.6659365079365079,
"eval_NanoNQ_MaxSim_ndcg@10": 0.694551389494681,
"eval_NanoNQ_MaxSim_precision@1": 0.6,
"eval_NanoNQ_MaxSim_precision@10": 0.088,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.15600000000000003,
"eval_NanoNQ_MaxSim_recall@1": 0.59,
"eval_NanoNQ_MaxSim_recall@10": 0.8,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.73,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.6,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24431040319791847,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5413492063492064,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3282070208557713,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.16,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2733333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23200000000000004,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.32866666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.16866666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2386666666666667,
"eval_runtime": 34.4733,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 15500
},
{
"epoch": 0.5632378958009893,
"grad_norm": 0.2131834477186203,
"learning_rate": 1.3102863125970323e-05,
"loss": 0.0322,
"step": 15600
},
{
"epoch": 0.5668483951330469,
"grad_norm": 0.13113602995872498,
"learning_rate": 1.2994548146008594e-05,
"loss": 0.0314,
"step": 15700
},
{
"epoch": 0.5704588944651046,
"grad_norm": 0.1361074149608612,
"learning_rate": 1.2886233166046864e-05,
"loss": 0.0312,
"step": 15800
},
{
"epoch": 0.5740693937971622,
"grad_norm": 0.2362322360277176,
"learning_rate": 1.2777918186085135e-05,
"loss": 0.0301,
"step": 15900
},
{
"epoch": 0.5776798931292197,
"grad_norm": 0.15715058147907257,
"learning_rate": 1.2669603206123407e-05,
"loss": 0.0316,
"step": 16000
},
{
"epoch": 0.5776798931292197,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.61,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8566666666666666,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7466666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7999999999999999,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5329125189767242,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6908743386243387,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.602973585199654,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.61,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19300000000000003,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.36666666666666664,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2826666666666666,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.32283886705992915,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6160080523895414,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4784274912213355,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5500143451360414,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.8,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.94,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.96,
"eval_NanoDBPedia_MaxSim_map@100": 0.5286285310884441,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8705555555555557,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6698534967697684,
"eval_NanoDBPedia_MaxSim_precision@1": 0.8,
"eval_NanoDBPedia_MaxSim_precision@10": 0.536,
"eval_NanoDBPedia_MaxSim_precision@3": 0.68,
"eval_NanoDBPedia_MaxSim_precision@5": 0.612,
"eval_NanoDBPedia_MaxSim_recall@1": 0.10078717061354299,
"eval_NanoDBPedia_MaxSim_recall@10": 0.38800863179756623,
"eval_NanoDBPedia_MaxSim_recall@3": 0.19682685208991746,
"eval_NanoDBPedia_MaxSim_recall@5": 0.258824166054344,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.5,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.68,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.72,
"eval_NanoFiQA2018_MaxSim_map@100": 0.4240652086517142,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5813333333333333,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.48685797628778266,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.5,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.126,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.3,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21999999999999997,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.2625793650793651,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5433730158730159,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4490714285714285,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.510595238095238,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.92,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7765272955432649,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9566666666666667,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8348237890721252,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.92,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.17,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.336,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.46,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.84,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.44,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.78,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.6,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.72,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5606473245064795,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5503333333333333,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6061357635735324,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.44,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.07800000000000001,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.2,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14400000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.44,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.78,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.6,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.72,
"eval_NanoNQ_MaxSim_accuracy@1": 0.6,
"eval_NanoNQ_MaxSim_accuracy@10": 0.84,
"eval_NanoNQ_MaxSim_accuracy@3": 0.7,
"eval_NanoNQ_MaxSim_accuracy@5": 0.78,
"eval_NanoNQ_MaxSim_map@100": 0.6681879355431987,
"eval_NanoNQ_MaxSim_mrr@10": 0.6725,
"eval_NanoNQ_MaxSim_ndcg@10": 0.7019653954825936,
"eval_NanoNQ_MaxSim_precision@1": 0.6,
"eval_NanoNQ_MaxSim_precision@10": 0.09,
"eval_NanoNQ_MaxSim_precision@3": 0.24,
"eval_NanoNQ_MaxSim_precision@5": 0.16,
"eval_NanoNQ_MaxSim_recall@1": 0.59,
"eval_NanoNQ_MaxSim_recall@10": 0.81,
"eval_NanoNQ_MaxSim_recall@3": 0.69,
"eval_NanoNQ_MaxSim_recall@5": 0.74,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.4,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.8,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.56,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.62,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.2394188185272444,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5138571428571429,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.31820509001212194,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.4,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.158,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.26666666666666666,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.22399999999999998,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08366666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.3246666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.16466666666666668,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.2306666666666667,
"eval_runtime": 34.5198,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 16000
},
{
"epoch": 0.5812903924612774,
"grad_norm": 0.07369329035282135,
"learning_rate": 1.2561288226161678e-05,
"loss": 0.0309,
"step": 16100
},
{
"epoch": 0.584900891793335,
"grad_norm": 0.14647921919822693,
"learning_rate": 1.2452973246199949e-05,
"loss": 0.0297,
"step": 16200
},
{
"epoch": 0.5885113911253926,
"grad_norm": 0.16381925344467163,
"learning_rate": 1.2344658266238221e-05,
"loss": 0.0319,
"step": 16300
},
{
"epoch": 0.5921218904574502,
"grad_norm": 0.14130234718322754,
"learning_rate": 1.2236343286276492e-05,
"loss": 0.0305,
"step": 16400
},
{
"epoch": 0.5957323897895079,
"grad_norm": 0.16018670797348022,
"learning_rate": 1.2128028306314764e-05,
"loss": 0.0309,
"step": 16500
},
{
"epoch": 0.5957323897895079,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.6,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8533333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7400000000000001,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.8066666666666666,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5301678457480149,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6859007936507938,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.6033352593022381,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.6,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19633333333333336,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3655555555555556,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.2833333333333333,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.3167025034235655,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.6200974556288524,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4719466015951799,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5452898516439584,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.76,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.92,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.98,
"eval_NanoDBPedia_MaxSim_map@100": 0.5217728515497932,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8516666666666667,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6724916384352155,
"eval_NanoDBPedia_MaxSim_precision@1": 0.76,
"eval_NanoDBPedia_MaxSim_precision@10": 0.548,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6866666666666668,
"eval_NanoDBPedia_MaxSim_precision@5": 0.624,
"eval_NanoDBPedia_MaxSim_recall@1": 0.07896898879536116,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3997117179000994,
"eval_NanoDBPedia_MaxSim_recall@3": 0.1869415143329846,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2624772051018455,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.66,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.72,
"eval_NanoFiQA2018_MaxSim_map@100": 0.41945754925956363,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5673333333333332,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.4862859045506256,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.132,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.29333333333333333,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21999999999999997,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.25257936507936507,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5522063492063493,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4390714285714285,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.510595238095238,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.767400174283261,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9433333333333335,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8270274923913367,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.17,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.324,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.81,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.46,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.78,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.58,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.72,
"eval_NanoMSMARCO_MaxSim_map@100": 0.56932758537367,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5601666666666667,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6130579735117773,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.46,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.07800000000000001,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.19333333333333333,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.14400000000000002,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.46,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.78,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.58,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.72,
"eval_NanoNQ_MaxSim_accuracy@1": 0.58,
"eval_NanoNQ_MaxSim_accuracy@10": 0.84,
"eval_NanoNQ_MaxSim_accuracy@3": 0.7,
"eval_NanoNQ_MaxSim_accuracy@5": 0.76,
"eval_NanoNQ_MaxSim_map@100": 0.6590040469326119,
"eval_NanoNQ_MaxSim_mrr@10": 0.6631904761904763,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6957225299673228,
"eval_NanoNQ_MaxSim_precision@1": 0.58,
"eval_NanoNQ_MaxSim_precision@10": 0.09,
"eval_NanoNQ_MaxSim_precision@3": 0.24,
"eval_NanoNQ_MaxSim_precision@5": 0.15600000000000003,
"eval_NanoNQ_MaxSim_recall@1": 0.57,
"eval_NanoNQ_MaxSim_recall@10": 0.81,
"eval_NanoNQ_MaxSim_recall@3": 0.69,
"eval_NanoNQ_MaxSim_recall@5": 0.73,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.78,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.58,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.66,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24404486708919013,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5297142857142858,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.32542601695715057,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.16,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.26666666666666666,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23200000000000004,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.32866666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.16566666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.23866666666666667,
"eval_runtime": 35.6054,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 16500
},
{
"epoch": 0.5993428891215655,
"grad_norm": 0.20602360367774963,
"learning_rate": 1.2019713326353035e-05,
"loss": 0.0312,
"step": 16600
},
{
"epoch": 0.6029533884536231,
"grad_norm": 0.24782870709896088,
"learning_rate": 1.1911398346391307e-05,
"loss": 0.0305,
"step": 16700
},
{
"epoch": 0.6065638877856807,
"grad_norm": 0.1552240401506424,
"learning_rate": 1.1803083366429578e-05,
"loss": 0.0306,
"step": 16800
},
{
"epoch": 0.6101743871177384,
"grad_norm": 0.20471926033496857,
"learning_rate": 1.169476838646785e-05,
"loss": 0.0314,
"step": 16900
},
{
"epoch": 0.613784886449796,
"grad_norm": 0.1991502344608307,
"learning_rate": 1.158645340650612e-05,
"loss": 0.0308,
"step": 17000
},
{
"epoch": 0.613784886449796,
"eval_NanoBEIR_mean_MaxSim_accuracy@1": 0.5966666666666667,
"eval_NanoBEIR_mean_MaxSim_accuracy@10": 0.8566666666666666,
"eval_NanoBEIR_mean_MaxSim_accuracy@3": 0.7533333333333334,
"eval_NanoBEIR_mean_MaxSim_accuracy@5": 0.7966666666666665,
"eval_NanoBEIR_mean_MaxSim_map@100": 0.5262103510898867,
"eval_NanoBEIR_mean_MaxSim_mrr@10": 0.6866547619047619,
"eval_NanoBEIR_mean_MaxSim_ndcg@10": 0.6006133143634821,
"eval_NanoBEIR_mean_MaxSim_precision@1": 0.5966666666666667,
"eval_NanoBEIR_mean_MaxSim_precision@10": 0.19633333333333333,
"eval_NanoBEIR_mean_MaxSim_precision@3": 0.3677777777777778,
"eval_NanoBEIR_mean_MaxSim_precision@5": 0.27999999999999997,
"eval_NanoBEIR_mean_MaxSim_recall@1": 0.30867220039326243,
"eval_NanoBEIR_mean_MaxSim_recall@10": 0.619513582099129,
"eval_NanoBEIR_mean_MaxSim_recall@3": 0.4806489965178266,
"eval_NanoBEIR_mean_MaxSim_recall@5": 0.5379534765131291,
"eval_NanoDBPedia_MaxSim_accuracy@1": 0.78,
"eval_NanoDBPedia_MaxSim_accuracy@10": 1.0,
"eval_NanoDBPedia_MaxSim_accuracy@3": 0.92,
"eval_NanoDBPedia_MaxSim_accuracy@5": 0.98,
"eval_NanoDBPedia_MaxSim_map@100": 0.5226380587911359,
"eval_NanoDBPedia_MaxSim_mrr@10": 0.8601904761904763,
"eval_NanoDBPedia_MaxSim_ndcg@10": 0.6719750956605776,
"eval_NanoDBPedia_MaxSim_precision@1": 0.78,
"eval_NanoDBPedia_MaxSim_precision@10": 0.552,
"eval_NanoDBPedia_MaxSim_precision@3": 0.6733333333333333,
"eval_NanoDBPedia_MaxSim_precision@5": 0.608,
"eval_NanoDBPedia_MaxSim_recall@1": 0.08078717061354299,
"eval_NanoDBPedia_MaxSim_recall@10": 0.3924306989439807,
"eval_NanoDBPedia_MaxSim_recall@3": 0.18515588386886442,
"eval_NanoDBPedia_MaxSim_recall@5": 0.2584589543168697,
"eval_NanoFiQA2018_MaxSim_accuracy@1": 0.48,
"eval_NanoFiQA2018_MaxSim_accuracy@10": 0.72,
"eval_NanoFiQA2018_MaxSim_accuracy@3": 0.68,
"eval_NanoFiQA2018_MaxSim_accuracy@5": 0.7,
"eval_NanoFiQA2018_MaxSim_map@100": 0.42052605899048506,
"eval_NanoFiQA2018_MaxSim_mrr@10": 0.5801904761904761,
"eval_NanoFiQA2018_MaxSim_ndcg@10": 0.48861441325613014,
"eval_NanoFiQA2018_MaxSim_precision@1": 0.48,
"eval_NanoFiQA2018_MaxSim_precision@10": 0.13,
"eval_NanoFiQA2018_MaxSim_precision@3": 0.3,
"eval_NanoFiQA2018_MaxSim_precision@5": 0.21599999999999997,
"eval_NanoFiQA2018_MaxSim_recall@1": 0.24257936507936506,
"eval_NanoFiQA2018_MaxSim_recall@10": 0.5499841269841269,
"eval_NanoFiQA2018_MaxSim_recall@3": 0.4490714285714285,
"eval_NanoFiQA2018_MaxSim_recall@5": 0.49059523809523803,
"eval_NanoHotpotQA_MaxSim_accuracy@1": 0.9,
"eval_NanoHotpotQA_MaxSim_accuracy@10": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@3": 1.0,
"eval_NanoHotpotQA_MaxSim_accuracy@5": 1.0,
"eval_NanoHotpotQA_MaxSim_map@100": 0.7669809034537017,
"eval_NanoHotpotQA_MaxSim_mrr@10": 0.9433333333333335,
"eval_NanoHotpotQA_MaxSim_ndcg@10": 0.8268658897142934,
"eval_NanoHotpotQA_MaxSim_precision@1": 0.9,
"eval_NanoHotpotQA_MaxSim_precision@10": 0.17,
"eval_NanoHotpotQA_MaxSim_precision@3": 0.5133333333333333,
"eval_NanoHotpotQA_MaxSim_precision@5": 0.32799999999999996,
"eval_NanoHotpotQA_MaxSim_recall@1": 0.45,
"eval_NanoHotpotQA_MaxSim_recall@10": 0.85,
"eval_NanoHotpotQA_MaxSim_recall@3": 0.77,
"eval_NanoHotpotQA_MaxSim_recall@5": 0.82,
"eval_NanoMSMARCO_MaxSim_accuracy@1": 0.44,
"eval_NanoMSMARCO_MaxSim_accuracy@10": 0.8,
"eval_NanoMSMARCO_MaxSim_accuracy@3": 0.64,
"eval_NanoMSMARCO_MaxSim_accuracy@5": 0.68,
"eval_NanoMSMARCO_MaxSim_map@100": 0.5604820061646906,
"eval_NanoMSMARCO_MaxSim_mrr@10": 0.5522222222222222,
"eval_NanoMSMARCO_MaxSim_ndcg@10": 0.6114841541262358,
"eval_NanoMSMARCO_MaxSim_precision@1": 0.44,
"eval_NanoMSMARCO_MaxSim_precision@10": 0.08,
"eval_NanoMSMARCO_MaxSim_precision@3": 0.21333333333333332,
"eval_NanoMSMARCO_MaxSim_precision@5": 0.136,
"eval_NanoMSMARCO_MaxSim_recall@1": 0.44,
"eval_NanoMSMARCO_MaxSim_recall@10": 0.8,
"eval_NanoMSMARCO_MaxSim_recall@3": 0.64,
"eval_NanoMSMARCO_MaxSim_recall@5": 0.68,
"eval_NanoNQ_MaxSim_accuracy@1": 0.56,
"eval_NanoNQ_MaxSim_accuracy@10": 0.82,
"eval_NanoNQ_MaxSim_accuracy@3": 0.68,
"eval_NanoNQ_MaxSim_accuracy@5": 0.78,
"eval_NanoNQ_MaxSim_map@100": 0.6433965160499178,
"eval_NanoNQ_MaxSim_mrr@10": 0.6473571428571429,
"eval_NanoNQ_MaxSim_ndcg@10": 0.6808803117635007,
"eval_NanoNQ_MaxSim_precision@1": 0.56,
"eval_NanoNQ_MaxSim_precision@10": 0.088,
"eval_NanoNQ_MaxSim_precision@3": 0.2333333333333333,
"eval_NanoNQ_MaxSim_precision@5": 0.16,
"eval_NanoNQ_MaxSim_recall@1": 0.55,
"eval_NanoNQ_MaxSim_recall@10": 0.8,
"eval_NanoNQ_MaxSim_recall@3": 0.67,
"eval_NanoNQ_MaxSim_recall@5": 0.74,
"eval_NanoSCIDOCS_MaxSim_accuracy@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_accuracy@10": 0.8,
"eval_NanoSCIDOCS_MaxSim_accuracy@3": 0.6,
"eval_NanoSCIDOCS_MaxSim_accuracy@5": 0.64,
"eval_NanoSCIDOCS_MaxSim_map@100": 0.24323856308938968,
"eval_NanoSCIDOCS_MaxSim_mrr@10": 0.5366349206349206,
"eval_NanoSCIDOCS_MaxSim_ndcg@10": 0.3238600216601547,
"eval_NanoSCIDOCS_MaxSim_precision@1": 0.42,
"eval_NanoSCIDOCS_MaxSim_precision@10": 0.158,
"eval_NanoSCIDOCS_MaxSim_precision@3": 0.2733333333333333,
"eval_NanoSCIDOCS_MaxSim_precision@5": 0.23199999999999998,
"eval_NanoSCIDOCS_MaxSim_recall@1": 0.08866666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@10": 0.3246666666666666,
"eval_NanoSCIDOCS_MaxSim_recall@3": 0.1696666666666667,
"eval_NanoSCIDOCS_MaxSim_recall@5": 0.23866666666666667,
"eval_runtime": 35.031,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 17000
}
],
"logging_steps": 100,
"max_steps": 27697,
"num_input_tokens_seen": 0,
"num_train_epochs": 1,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 0.0,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}