trentmkelly committed on May 30

Commit

cc3fdd2

verified ·

1 Parent(s): e4d7003

Upload folder using huggingface_hub

Browse files

Files changed (18) hide show

README.md +27 -0
checkpoint-6970/config.json +35 -0
checkpoint-6970/model.safetensors +3 -0
checkpoint-6970/optimizer.pt +3 -0
checkpoint-6970/rng_state.pth +3 -0
checkpoint-6970/scheduler.pt +3 -0
checkpoint-6970/trainer_state.json +2014 -0
checkpoint-6970/training_args.bin +3 -0
config.json +35 -0
model.safetensors +3 -0
runs/May30_00-09-04_r-trentmkelly-autotrain-advanced-9f8hpchj-c1d5e-s6v1w/events.out.tfevents.1748563746.r-trentmkelly-autotrain-advanced-9f8hpchj-c1d5e-s6v1w.75.0 +2 -2
runs/May30_00-09-04_r-trentmkelly-autotrain-advanced-9f8hpchj-c1d5e-s6v1w/events.out.tfevents.1748564133.r-trentmkelly-autotrain-advanced-9f8hpchj-c1d5e-s6v1w.75.1 +3 -0
special_tokens_map.json +44 -0
tokenizer.json +0 -0
tokenizer_config.json +72 -0
training_args.bin +3 -0
training_params.json +30 -0
vocab.txt +0 -0

README.md ADDED Viewed

	@@ -0,0 +1,27 @@

+---
+library_name: transformers
+tags:
+- autotrain
+- text-classification
+base_model: TaylorAI/gte-tiny
+widget:
+- text: "I love AutoTrain"
+---
+# Model Trained Using AutoTrain
+- Problem type: Text Classification
+## Validation Metrics
+loss: 0.04012129828333855
+f1: 0.9900353584056574
+precision: 0.9859154929577465
+recall: 0.9941897998708844
+auc: 0.999704926354536
+accuracy: 0.9899935442220787

checkpoint-6970/config.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "_name_or_path": "TaylorAI/gte-tiny",
+  "_num_labels": 2,
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 384,
+  "id2label": {
+    "0": "human",
+    "1": "llm"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 1536,
+  "label2id": {
+    "human": 0,
+    "llm": 1
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 6,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

checkpoint-6970/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e1dc3603f7927d59bbb28381542e7c65f0c7d40444c17d18e2bdefc35a0d77c0
+size 90867952

checkpoint-6970/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:466ebe4983d35a27315b3f0ceb0db7dc49bf07e1a58d60bc6a063c7df30bf468
+size 181799994

checkpoint-6970/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:31c8269223c50fe95286007f63e5c42016e01d16bf3cea35eac7ea46df2bdee1
+size 14244

checkpoint-6970/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e941fa1b7d020c0e74b4c2944df4fa2d6c820122b3692afc92f145357c7443d
+size 1064

checkpoint-6970/trainer_state.json ADDED Viewed

	@@ -0,0 +1,2014 @@

+{
+  "best_metric": 0.04012129828333855,
+  "best_model_checkpoint": "slop-detector-mini/checkpoint-6970",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 6970,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.007173601147776184,
+      "grad_norm": 0.4645521938800812,
+      "learning_rate": 1.1950286806883365e-06,
+      "loss": 0.6918,
+      "step": 25
+    },
+    {
+      "epoch": 0.014347202295552367,
+      "grad_norm": 0.9209471940994263,
+      "learning_rate": 2.390057361376673e-06,
+      "loss": 0.6919,
+      "step": 50
+    },
+    {
+      "epoch": 0.021520803443328552,
+      "grad_norm": 0.5008063316345215,
+      "learning_rate": 3.58508604206501e-06,
+      "loss": 0.6918,
+      "step": 75
+    },
+    {
+      "epoch": 0.028694404591104734,
+      "grad_norm": 2.1300737857818604,
+      "learning_rate": 4.780114722753346e-06,
+      "loss": 0.6872,
+      "step": 100
+    },
+    {
+      "epoch": 0.035868005738880916,
+      "grad_norm": 0.9959478974342346,
+      "learning_rate": 5.9751434034416826e-06,
+      "loss": 0.6896,
+      "step": 125
+    },
+    {
+      "epoch": 0.043041606886657105,
+      "grad_norm": 1.5318769216537476,
+      "learning_rate": 7.17017208413002e-06,
+      "loss": 0.6838,
+      "step": 150
+    },
+    {
+      "epoch": 0.05021520803443329,
+      "grad_norm": 1.0408401489257812,
+      "learning_rate": 8.365200764818356e-06,
+      "loss": 0.6665,
+      "step": 175
+    },
+    {
+      "epoch": 0.05738880918220947,
+      "grad_norm": 1.6900608539581299,
+      "learning_rate": 9.560229445506692e-06,
+      "loss": 0.5941,
+      "step": 200
+    },
+    {
+      "epoch": 0.06456241032998565,
+      "grad_norm": 1.8240679502487183,
+      "learning_rate": 1.075525812619503e-05,
+      "loss": 0.4528,
+      "step": 225
+    },
+    {
+      "epoch": 0.07173601147776183,
+      "grad_norm": 9.910821914672852,
+      "learning_rate": 1.1950286806883365e-05,
+      "loss": 0.3188,
+      "step": 250
+    },
+    {
+      "epoch": 0.07890961262553801,
+      "grad_norm": 4.513535022735596,
+      "learning_rate": 1.3145315487571702e-05,
+      "loss": 0.292,
+      "step": 275
+    },
+    {
+      "epoch": 0.08608321377331421,
+      "grad_norm": 0.8180878162384033,
+      "learning_rate": 1.434034416826004e-05,
+      "loss": 0.1973,
+      "step": 300
+    },
+    {
+      "epoch": 0.09325681492109039,
+      "grad_norm": 0.6453915238380432,
+      "learning_rate": 1.5535372848948377e-05,
+      "loss": 0.1999,
+      "step": 325
+    },
+    {
+      "epoch": 0.10043041606886657,
+      "grad_norm": 1.2022216320037842,
+      "learning_rate": 1.6682600382409177e-05,
+      "loss": 0.155,
+      "step": 350
+    },
+    {
+      "epoch": 0.10760401721664276,
+      "grad_norm": 0.4976617693901062,
+      "learning_rate": 1.7877629063097516e-05,
+      "loss": 0.1583,
+      "step": 375
+    },
+    {
+      "epoch": 0.11477761836441894,
+      "grad_norm": 2.098670482635498,
+      "learning_rate": 1.9072657743785852e-05,
+      "loss": 0.1178,
+      "step": 400
+    },
+    {
+      "epoch": 0.12195121951219512,
+      "grad_norm": 0.7542682886123657,
+      "learning_rate": 2.0267686424474187e-05,
+      "loss": 0.169,
+      "step": 425
+    },
+    {
+      "epoch": 0.1291248206599713,
+      "grad_norm": 10.018378257751465,
+      "learning_rate": 2.1414913957934994e-05,
+      "loss": 0.1356,
+      "step": 450
+    },
+    {
+      "epoch": 0.13629842180774748,
+      "grad_norm": 34.80171203613281,
+      "learning_rate": 2.2609942638623326e-05,
+      "loss": 0.1258,
+      "step": 475
+    },
+    {
+      "epoch": 0.14347202295552366,
+      "grad_norm": 0.1728999763727188,
+      "learning_rate": 2.3804971319311666e-05,
+      "loss": 0.0863,
+      "step": 500
+    },
+    {
+      "epoch": 0.15064562410329985,
+      "grad_norm": 0.1769145131111145,
+      "learning_rate": 2.5e-05,
+      "loss": 0.1017,
+      "step": 525
+    },
+    {
+      "epoch": 0.15781922525107603,
+      "grad_norm": 6.390002250671387,
+      "learning_rate": 2.6195028680688337e-05,
+      "loss": 0.0829,
+      "step": 550
+    },
+    {
+      "epoch": 0.1649928263988522,
+      "grad_norm": 0.13392409682273865,
+      "learning_rate": 2.7390057361376676e-05,
+      "loss": 0.0991,
+      "step": 575
+    },
+    {
+      "epoch": 0.17216642754662842,
+      "grad_norm": 9.020365715026855,
+      "learning_rate": 2.853728489483748e-05,
+      "loss": 0.1088,
+      "step": 600
+    },
+    {
+      "epoch": 0.1793400286944046,
+      "grad_norm": 0.17115327715873718,
+      "learning_rate": 2.9732313575525815e-05,
+      "loss": 0.0858,
+      "step": 625
+    },
+    {
+      "epoch": 0.18651362984218078,
+      "grad_norm": 0.1999664157629013,
+      "learning_rate": 3.092734225621415e-05,
+      "loss": 0.1257,
+      "step": 650
+    },
+    {
+      "epoch": 0.19368723098995697,
+      "grad_norm": 0.10073782503604889,
+      "learning_rate": 3.2122370936902486e-05,
+      "loss": 0.0434,
+      "step": 675
+    },
+    {
+      "epoch": 0.20086083213773315,
+      "grad_norm": 14.117579460144043,
+      "learning_rate": 3.331739961759082e-05,
+      "loss": 0.169,
+      "step": 700
+    },
+    {
+      "epoch": 0.20803443328550933,
+      "grad_norm": 48.392974853515625,
+      "learning_rate": 3.451242829827916e-05,
+      "loss": 0.0908,
+      "step": 725
+    },
+    {
+      "epoch": 0.2152080344332855,
+      "grad_norm": 0.10534697771072388,
+      "learning_rate": 3.570745697896749e-05,
+      "loss": 0.1517,
+      "step": 750
+    },
+    {
+      "epoch": 0.2223816355810617,
+      "grad_norm": 0.07163497805595398,
+      "learning_rate": 3.6902485659655836e-05,
+      "loss": 0.054,
+      "step": 775
+    },
+    {
+      "epoch": 0.22955523672883787,
+      "grad_norm": 0.0702139139175415,
+      "learning_rate": 3.809751434034417e-05,
+      "loss": 0.1009,
+      "step": 800
+    },
+    {
+      "epoch": 0.23672883787661406,
+      "grad_norm": 0.698357105255127,
+      "learning_rate": 3.929254302103251e-05,
+      "loss": 0.0344,
+      "step": 825
+    },
+    {
+      "epoch": 0.24390243902439024,
+      "grad_norm": 0.05920593440532684,
+      "learning_rate": 4.048757170172084e-05,
+      "loss": 0.104,
+      "step": 850
+    },
+    {
+      "epoch": 0.25107604017216645,
+      "grad_norm": 0.08545070886611938,
+      "learning_rate": 4.168260038240918e-05,
+      "loss": 0.1973,
+      "step": 875
+    },
+    {
+      "epoch": 0.2582496413199426,
+      "grad_norm": 29.820629119873047,
+      "learning_rate": 4.287762906309752e-05,
+      "loss": 0.1245,
+      "step": 900
+    },
+    {
+      "epoch": 0.2654232424677188,
+      "grad_norm": 18.92865562438965,
+      "learning_rate": 4.4072657743785856e-05,
+      "loss": 0.1508,
+      "step": 925
+    },
+    {
+      "epoch": 0.27259684361549497,
+      "grad_norm": 3.224970579147339,
+      "learning_rate": 4.5267686424474185e-05,
+      "loss": 0.0772,
+      "step": 950
+    },
+    {
+      "epoch": 0.2797704447632712,
+      "grad_norm": 56.050315856933594,
+      "learning_rate": 4.646271510516252e-05,
+      "loss": 0.0839,
+      "step": 975
+    },
+    {
+      "epoch": 0.28694404591104733,
+      "grad_norm": 45.18210983276367,
+      "learning_rate": 4.7657743785850863e-05,
+      "loss": 0.1926,
+      "step": 1000
+    },
+    {
+      "epoch": 0.29411764705882354,
+      "grad_norm": 0.06930357962846756,
+      "learning_rate": 4.88527724665392e-05,
+      "loss": 0.1326,
+      "step": 1025
+    },
+    {
+      "epoch": 0.3012912482065997,
+      "grad_norm": 0.05295657739043236,
+      "learning_rate": 4.9994685938994586e-05,
+      "loss": 0.0758,
+      "step": 1050
+    },
+    {
+      "epoch": 0.3084648493543759,
+      "grad_norm": 21.23689842224121,
+      "learning_rate": 4.986183441385907e-05,
+      "loss": 0.0863,
+      "step": 1075
+    },
+    {
+      "epoch": 0.31563845050215206,
+      "grad_norm": 55.6703987121582,
+      "learning_rate": 4.9728982888723565e-05,
+      "loss": 0.1115,
+      "step": 1100
+    },
+    {
+      "epoch": 0.32281205164992827,
+      "grad_norm": 0.04365883022546768,
+      "learning_rate": 4.9596131363588055e-05,
+      "loss": 0.0404,
+      "step": 1125
+    },
+    {
+      "epoch": 0.3299856527977044,
+      "grad_norm": 0.033937107771635056,
+      "learning_rate": 4.9463279838452545e-05,
+      "loss": 0.0963,
+      "step": 1150
+    },
+    {
+      "epoch": 0.33715925394548063,
+      "grad_norm": 0.049055054783821106,
+      "learning_rate": 4.933042831331704e-05,
+      "loss": 0.0539,
+      "step": 1175
+    },
+    {
+      "epoch": 0.34433285509325684,
+      "grad_norm": 0.038862813264131546,
+      "learning_rate": 4.919757678818153e-05,
+      "loss": 0.0102,
+      "step": 1200
+    },
+    {
+      "epoch": 0.351506456241033,
+      "grad_norm": 0.0405915193259716,
+      "learning_rate": 4.906472526304603e-05,
+      "loss": 0.0745,
+      "step": 1225
+    },
+    {
+      "epoch": 0.3586800573888092,
+      "grad_norm": 0.05233052000403404,
+      "learning_rate": 4.893187373791052e-05,
+      "loss": 0.0743,
+      "step": 1250
+    },
+    {
+      "epoch": 0.36585365853658536,
+      "grad_norm": 0.037946607917547226,
+      "learning_rate": 4.8799022212775e-05,
+      "loss": 0.0348,
+      "step": 1275
+    },
+    {
+      "epoch": 0.37302725968436157,
+      "grad_norm": 0.031401779502630234,
+      "learning_rate": 4.8666170687639496e-05,
+      "loss": 0.0385,
+      "step": 1300
+    },
+    {
+      "epoch": 0.3802008608321377,
+      "grad_norm": 0.04547421261668205,
+      "learning_rate": 4.8533319162503986e-05,
+      "loss": 0.1143,
+      "step": 1325
+    },
+    {
+      "epoch": 0.38737446197991393,
+      "grad_norm": 0.05827297270298004,
+      "learning_rate": 4.840046763736848e-05,
+      "loss": 0.0772,
+      "step": 1350
+    },
+    {
+      "epoch": 0.3945480631276901,
+      "grad_norm": 0.08565480262041092,
+      "learning_rate": 4.826761611223297e-05,
+      "loss": 0.1192,
+      "step": 1375
+    },
+    {
+      "epoch": 0.4017216642754663,
+      "grad_norm": 0.03007586859166622,
+      "learning_rate": 4.813476458709746e-05,
+      "loss": 0.0613,
+      "step": 1400
+    },
+    {
+      "epoch": 0.40889526542324245,
+      "grad_norm": 0.027408963069319725,
+      "learning_rate": 4.800191306196196e-05,
+      "loss": 0.0029,
+      "step": 1425
+    },
+    {
+      "epoch": 0.41606886657101866,
+      "grad_norm": 0.028056548908352852,
+      "learning_rate": 4.786906153682644e-05,
+      "loss": 0.0902,
+      "step": 1450
+    },
+    {
+      "epoch": 0.4232424677187948,
+      "grad_norm": 0.08005893230438232,
+      "learning_rate": 4.773621001169094e-05,
+      "loss": 0.1209,
+      "step": 1475
+    },
+    {
+      "epoch": 0.430416068866571,
+      "grad_norm": 0.06766340136528015,
+      "learning_rate": 4.760335848655543e-05,
+      "loss": 0.0201,
+      "step": 1500
+    },
+    {
+      "epoch": 0.4375896700143472,
+      "grad_norm": 0.03779875114560127,
+      "learning_rate": 4.747050696141992e-05,
+      "loss": 0.0622,
+      "step": 1525
+    },
+    {
+      "epoch": 0.4447632711621234,
+      "grad_norm": 0.03687926381826401,
+      "learning_rate": 4.7337655436284414e-05,
+      "loss": 0.121,
+      "step": 1550
+    },
+    {
+      "epoch": 0.4519368723098996,
+      "grad_norm": 0.03594242036342621,
+      "learning_rate": 4.7204803911148904e-05,
+      "loss": 0.1053,
+      "step": 1575
+    },
+    {
+      "epoch": 0.45911047345767575,
+      "grad_norm": 0.03990463539958,
+      "learning_rate": 4.707195238601339e-05,
+      "loss": 0.0571,
+      "step": 1600
+    },
+    {
+      "epoch": 0.46628407460545196,
+      "grad_norm": 0.04624362289905548,
+      "learning_rate": 4.693910086087788e-05,
+      "loss": 0.1129,
+      "step": 1625
+    },
+    {
+      "epoch": 0.4734576757532281,
+      "grad_norm": 0.035806916654109955,
+      "learning_rate": 4.680624933574237e-05,
+      "loss": 0.0464,
+      "step": 1650
+    },
+    {
+      "epoch": 0.4806312769010043,
+      "grad_norm": 4.62434720993042,
+      "learning_rate": 4.667339781060687e-05,
+      "loss": 0.052,
+      "step": 1675
+    },
+    {
+      "epoch": 0.4878048780487805,
+      "grad_norm": 0.028078608214855194,
+      "learning_rate": 4.654054628547136e-05,
+      "loss": 0.1337,
+      "step": 1700
+    },
+    {
+      "epoch": 0.4949784791965567,
+      "grad_norm": 0.029056400060653687,
+      "learning_rate": 4.640769476033585e-05,
+      "loss": 0.0727,
+      "step": 1725
+    },
+    {
+      "epoch": 0.5021520803443329,
+      "grad_norm": 0.021900108084082603,
+      "learning_rate": 4.6274843235200345e-05,
+      "loss": 0.0704,
+      "step": 1750
+    },
+    {
+      "epoch": 0.509325681492109,
+      "grad_norm": 0.019067928194999695,
+      "learning_rate": 4.6141991710064835e-05,
+      "loss": 0.0147,
+      "step": 1775
+    },
+    {
+      "epoch": 0.5164992826398852,
+      "grad_norm": 54.136009216308594,
+      "learning_rate": 4.6009140184929324e-05,
+      "loss": 0.1138,
+      "step": 1800
+    },
+    {
+      "epoch": 0.5236728837876614,
+      "grad_norm": 0.030056435614824295,
+      "learning_rate": 4.5876288659793814e-05,
+      "loss": 0.0791,
+      "step": 1825
+    },
+    {
+      "epoch": 0.5308464849354376,
+      "grad_norm": 0.022308100014925003,
+      "learning_rate": 4.5743437134658304e-05,
+      "loss": 0.0643,
+      "step": 1850
+    },
+    {
+      "epoch": 0.5380200860832137,
+      "grad_norm": 0.13602350652217865,
+      "learning_rate": 4.56105856095228e-05,
+      "loss": 0.0891,
+      "step": 1875
+    },
+    {
+      "epoch": 0.5451936872309899,
+      "grad_norm": 2.2635345458984375,
+      "learning_rate": 4.547773408438729e-05,
+      "loss": 0.0951,
+      "step": 1900
+    },
+    {
+      "epoch": 0.5523672883787661,
+      "grad_norm": 0.02811610698699951,
+      "learning_rate": 4.5344882559251787e-05,
+      "loss": 0.0116,
+      "step": 1925
+    },
+    {
+      "epoch": 0.5595408895265424,
+      "grad_norm": 0.02545151859521866,
+      "learning_rate": 4.5212031034116276e-05,
+      "loss": 0.0335,
+      "step": 1950
+    },
+    {
+      "epoch": 0.5667144906743186,
+      "grad_norm": 0.20565590262413025,
+      "learning_rate": 4.5079179508980766e-05,
+      "loss": 0.1518,
+      "step": 1975
+    },
+    {
+      "epoch": 0.5738880918220947,
+      "grad_norm": 26.854698181152344,
+      "learning_rate": 4.4946327983845256e-05,
+      "loss": 0.0928,
+      "step": 2000
+    },
+    {
+      "epoch": 0.5810616929698709,
+      "grad_norm": 0.28100213408470154,
+      "learning_rate": 4.4813476458709745e-05,
+      "loss": 0.0961,
+      "step": 2025
+    },
+    {
+      "epoch": 0.5882352941176471,
+      "grad_norm": 0.020814087241888046,
+      "learning_rate": 4.468062493357424e-05,
+      "loss": 0.0564,
+      "step": 2050
+    },
+    {
+      "epoch": 0.5954088952654233,
+      "grad_norm": 0.019664647057652473,
+      "learning_rate": 4.454777340843873e-05,
+      "loss": 0.0344,
+      "step": 2075
+    },
+    {
+      "epoch": 0.6025824964131994,
+      "grad_norm": 0.11771227419376373,
+      "learning_rate": 4.441492188330322e-05,
+      "loss": 0.1018,
+      "step": 2100
+    },
+    {
+      "epoch": 0.6097560975609756,
+      "grad_norm": 0.3748355209827423,
+      "learning_rate": 4.428207035816772e-05,
+      "loss": 0.1281,
+      "step": 2125
+    },
+    {
+      "epoch": 0.6169296987087518,
+      "grad_norm": 0.02155977115035057,
+      "learning_rate": 4.414921883303221e-05,
+      "loss": 0.0264,
+      "step": 2150
+    },
+    {
+      "epoch": 0.624103299856528,
+      "grad_norm": 0.017244333401322365,
+      "learning_rate": 4.40163673078967e-05,
+      "loss": 0.0611,
+      "step": 2175
+    },
+    {
+      "epoch": 0.6312769010043041,
+      "grad_norm": 0.014310152269899845,
+      "learning_rate": 4.388351578276119e-05,
+      "loss": 0.0444,
+      "step": 2200
+    },
+    {
+      "epoch": 0.6384505021520803,
+      "grad_norm": 0.015014859847724438,
+      "learning_rate": 4.375066425762568e-05,
+      "loss": 0.0199,
+      "step": 2225
+    },
+    {
+      "epoch": 0.6456241032998565,
+      "grad_norm": 0.028923267498612404,
+      "learning_rate": 4.361781273249017e-05,
+      "loss": 0.0668,
+      "step": 2250
+    },
+    {
+      "epoch": 0.6527977044476327,
+      "grad_norm": 0.017175152897834778,
+      "learning_rate": 4.348496120735466e-05,
+      "loss": 0.0333,
+      "step": 2275
+    },
+    {
+      "epoch": 0.6599713055954088,
+      "grad_norm": 0.018409280106425285,
+      "learning_rate": 4.335210968221915e-05,
+      "loss": 0.1059,
+      "step": 2300
+    },
+    {
+      "epoch": 0.667144906743185,
+      "grad_norm": 0.019378701224923134,
+      "learning_rate": 4.321925815708365e-05,
+      "loss": 0.0403,
+      "step": 2325
+    },
+    {
+      "epoch": 0.6743185078909613,
+      "grad_norm": 0.015860414132475853,
+      "learning_rate": 4.308640663194813e-05,
+      "loss": 0.0929,
+      "step": 2350
+    },
+    {
+      "epoch": 0.6814921090387375,
+      "grad_norm": 0.01943328231573105,
+      "learning_rate": 4.295355510681263e-05,
+      "loss": 0.0014,
+      "step": 2375
+    },
+    {
+      "epoch": 0.6886657101865137,
+      "grad_norm": 0.4460265040397644,
+      "learning_rate": 4.282070358167712e-05,
+      "loss": 0.0233,
+      "step": 2400
+    },
+    {
+      "epoch": 0.6958393113342898,
+      "grad_norm": 0.013770678080618382,
+      "learning_rate": 4.268785205654161e-05,
+      "loss": 0.0438,
+      "step": 2425
+    },
+    {
+      "epoch": 0.703012912482066,
+      "grad_norm": 0.466856986284256,
+      "learning_rate": 4.2555000531406104e-05,
+      "loss": 0.0331,
+      "step": 2450
+    },
+    {
+      "epoch": 0.7101865136298422,
+      "grad_norm": 0.05924264341592789,
+      "learning_rate": 4.2422149006270594e-05,
+      "loss": 0.0502,
+      "step": 2475
+    },
+    {
+      "epoch": 0.7173601147776184,
+      "grad_norm": 2.5010907649993896,
+      "learning_rate": 4.228929748113509e-05,
+      "loss": 0.0245,
+      "step": 2500
+    },
+    {
+      "epoch": 0.7245337159253945,
+      "grad_norm": 0.011777346953749657,
+      "learning_rate": 4.215644595599958e-05,
+      "loss": 0.0585,
+      "step": 2525
+    },
+    {
+      "epoch": 0.7317073170731707,
+      "grad_norm": 0.021891452372074127,
+      "learning_rate": 4.202359443086406e-05,
+      "loss": 0.1348,
+      "step": 2550
+    },
+    {
+      "epoch": 0.7388809182209469,
+      "grad_norm": 0.011559663340449333,
+      "learning_rate": 4.189074290572856e-05,
+      "loss": 0.0781,
+      "step": 2575
+    },
+    {
+      "epoch": 0.7460545193687231,
+      "grad_norm": 0.011871904134750366,
+      "learning_rate": 4.175789138059305e-05,
+      "loss": 0.1001,
+      "step": 2600
+    },
+    {
+      "epoch": 0.7532281205164992,
+      "grad_norm": 0.011486608535051346,
+      "learning_rate": 4.1625039855457546e-05,
+      "loss": 0.036,
+      "step": 2625
+    },
+    {
+      "epoch": 0.7604017216642754,
+      "grad_norm": 0.03866451606154442,
+      "learning_rate": 4.1492188330322036e-05,
+      "loss": 0.0781,
+      "step": 2650
+    },
+    {
+      "epoch": 0.7675753228120517,
+      "grad_norm": 0.04854358360171318,
+      "learning_rate": 4.1359336805186525e-05,
+      "loss": 0.018,
+      "step": 2675
+    },
+    {
+      "epoch": 0.7747489239598279,
+      "grad_norm": 26.049694061279297,
+      "learning_rate": 4.122648528005102e-05,
+      "loss": 0.1062,
+      "step": 2700
+    },
+    {
+      "epoch": 0.7819225251076041,
+      "grad_norm": 0.09440884739160538,
+      "learning_rate": 4.1093633754915505e-05,
+      "loss": 0.0293,
+      "step": 2725
+    },
+    {
+      "epoch": 0.7890961262553802,
+      "grad_norm": 0.008743391372263432,
+      "learning_rate": 4.096078222978e-05,
+      "loss": 0.1154,
+      "step": 2750
+    },
+    {
+      "epoch": 0.7962697274031564,
+      "grad_norm": 0.0563165545463562,
+      "learning_rate": 4.082793070464449e-05,
+      "loss": 0.0505,
+      "step": 2775
+    },
+    {
+      "epoch": 0.8034433285509326,
+      "grad_norm": 0.031961794942617416,
+      "learning_rate": 4.069507917950898e-05,
+      "loss": 0.0698,
+      "step": 2800
+    },
+    {
+      "epoch": 0.8106169296987088,
+      "grad_norm": 0.013981098309159279,
+      "learning_rate": 4.056222765437348e-05,
+      "loss": 0.0531,
+      "step": 2825
+    },
+    {
+      "epoch": 0.8177905308464849,
+      "grad_norm": 0.016712762415409088,
+      "learning_rate": 4.042937612923797e-05,
+      "loss": 0.0847,
+      "step": 2850
+    },
+    {
+      "epoch": 0.8249641319942611,
+      "grad_norm": 46.247108459472656,
+      "learning_rate": 4.0296524604102456e-05,
+      "loss": 0.0463,
+      "step": 2875
+    },
+    {
+      "epoch": 0.8321377331420373,
+      "grad_norm": 31.703798294067383,
+      "learning_rate": 4.0163673078966946e-05,
+      "loss": 0.0719,
+      "step": 2900
+    },
+    {
+      "epoch": 0.8393113342898135,
+      "grad_norm": 0.010652084834873676,
+      "learning_rate": 4.0030821553831436e-05,
+      "loss": 0.0805,
+      "step": 2925
+    },
+    {
+      "epoch": 0.8464849354375896,
+      "grad_norm": 0.00876002386212349,
+      "learning_rate": 3.989797002869593e-05,
+      "loss": 0.0358,
+      "step": 2950
+    },
+    {
+      "epoch": 0.8536585365853658,
+      "grad_norm": 0.042157307267189026,
+      "learning_rate": 3.976511850356042e-05,
+      "loss": 0.0322,
+      "step": 2975
+    },
+    {
+      "epoch": 0.860832137733142,
+      "grad_norm": 0.01021247822791338,
+      "learning_rate": 3.963226697842491e-05,
+      "loss": 0.0437,
+      "step": 3000
+    },
+    {
+      "epoch": 0.8680057388809183,
+      "grad_norm": 0.010883198119699955,
+      "learning_rate": 3.949941545328941e-05,
+      "loss": 0.0059,
+      "step": 3025
+    },
+    {
+      "epoch": 0.8751793400286944,
+      "grad_norm": 0.006532243452966213,
+      "learning_rate": 3.93665639281539e-05,
+      "loss": 0.0149,
+      "step": 3050
+    },
+    {
+      "epoch": 0.8823529411764706,
+      "grad_norm": 0.006005235482007265,
+      "learning_rate": 3.9233712403018394e-05,
+      "loss": 0.0036,
+      "step": 3075
+    },
+    {
+      "epoch": 0.8895265423242468,
+      "grad_norm": 0.0063223764300346375,
+      "learning_rate": 3.910086087788288e-05,
+      "loss": 0.0095,
+      "step": 3100
+    },
+    {
+      "epoch": 0.896700143472023,
+      "grad_norm": 0.009072021581232548,
+      "learning_rate": 3.896800935274737e-05,
+      "loss": 0.0004,
+      "step": 3125
+    },
+    {
+      "epoch": 0.9038737446197992,
+      "grad_norm": 0.05379496142268181,
+      "learning_rate": 3.8835157827611864e-05,
+      "loss": 0.1547,
+      "step": 3150
+    },
+    {
+      "epoch": 0.9110473457675753,
+      "grad_norm": 0.013865516521036625,
+      "learning_rate": 3.870230630247635e-05,
+      "loss": 0.0036,
+      "step": 3175
+    },
+    {
+      "epoch": 0.9182209469153515,
+      "grad_norm": 0.010529842227697372,
+      "learning_rate": 3.856945477734085e-05,
+      "loss": 0.0344,
+      "step": 3200
+    },
+    {
+      "epoch": 0.9253945480631277,
+      "grad_norm": 0.014116561971604824,
+      "learning_rate": 3.843660325220534e-05,
+      "loss": 0.123,
+      "step": 3225
+    },
+    {
+      "epoch": 0.9325681492109039,
+      "grad_norm": 0.0235675647854805,
+      "learning_rate": 3.830375172706983e-05,
+      "loss": 0.0471,
+      "step": 3250
+    },
+    {
+      "epoch": 0.93974175035868,
+      "grad_norm": 0.07236867398023605,
+      "learning_rate": 3.817090020193432e-05,
+      "loss": 0.0576,
+      "step": 3275
+    },
+    {
+      "epoch": 0.9469153515064562,
+      "grad_norm": 0.008477970026433468,
+      "learning_rate": 3.803804867679881e-05,
+      "loss": 0.0656,
+      "step": 3300
+    },
+    {
+      "epoch": 0.9540889526542324,
+      "grad_norm": 0.009889235720038414,
+      "learning_rate": 3.7905197151663305e-05,
+      "loss": 0.0141,
+      "step": 3325
+    },
+    {
+      "epoch": 0.9612625538020086,
+      "grad_norm": 0.04827851429581642,
+      "learning_rate": 3.7772345626527795e-05,
+      "loss": 0.2139,
+      "step": 3350
+    },
+    {
+      "epoch": 0.9684361549497847,
+      "grad_norm": 0.022464429959654808,
+      "learning_rate": 3.7639494101392285e-05,
+      "loss": 0.0343,
+      "step": 3375
+    },
+    {
+      "epoch": 0.975609756097561,
+      "grad_norm": 0.02515058033168316,
+      "learning_rate": 3.750664257625678e-05,
+      "loss": 0.0389,
+      "step": 3400
+    },
+    {
+      "epoch": 0.9827833572453372,
+      "grad_norm": 0.04209022969007492,
+      "learning_rate": 3.737379105112127e-05,
+      "loss": 0.0556,
+      "step": 3425
+    },
+    {
+      "epoch": 0.9899569583931134,
+      "grad_norm": 0.025623561814427376,
+      "learning_rate": 3.724093952598576e-05,
+      "loss": 0.11,
+      "step": 3450
+    },
+    {
+      "epoch": 0.9971305595408895,
+      "grad_norm": 0.044107332825660706,
+      "learning_rate": 3.710808800085025e-05,
+      "loss": 0.0703,
+      "step": 3475
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.9874112330535829,
+      "eval_auc": 0.9992416857373987,
+      "eval_f1": 0.9875120076849183,
+      "eval_loss": 0.0463985949754715,
+      "eval_precision": 0.9796696315120712,
+      "eval_recall": 0.9954809554551324,
+      "eval_runtime": 4.3248,
+      "eval_samples_per_second": 716.333,
+      "eval_steps_per_second": 44.857,
+      "step": 3485
+    },
+    {
+      "epoch": 1.0043041606886658,
+      "grad_norm": 0.006846719887107611,
+      "learning_rate": 3.697523647571474e-05,
+      "loss": 0.009,
+      "step": 3500
+    },
+    {
+      "epoch": 1.011477761836442,
+      "grad_norm": 3.4670445919036865,
+      "learning_rate": 3.6842384950579236e-05,
+      "loss": 0.034,
+      "step": 3525
+    },
+    {
+      "epoch": 1.018651362984218,
+      "grad_norm": 14.726991653442383,
+      "learning_rate": 3.6709533425443726e-05,
+      "loss": 0.0348,
+      "step": 3550
+    },
+    {
+      "epoch": 1.0258249641319943,
+      "grad_norm": 0.01886272057890892,
+      "learning_rate": 3.6576681900308216e-05,
+      "loss": 0.045,
+      "step": 3575
+    },
+    {
+      "epoch": 1.0329985652797704,
+      "grad_norm": 0.04845844581723213,
+      "learning_rate": 3.644383037517271e-05,
+      "loss": 0.0386,
+      "step": 3600
+    },
+    {
+      "epoch": 1.0401721664275467,
+      "grad_norm": 0.04974396526813507,
+      "learning_rate": 3.63109788500372e-05,
+      "loss": 0.0336,
+      "step": 3625
+    },
+    {
+      "epoch": 1.0473457675753228,
+      "grad_norm": 0.009641916491091251,
+      "learning_rate": 3.617812732490169e-05,
+      "loss": 0.0118,
+      "step": 3650
+    },
+    {
+      "epoch": 1.054519368723099,
+      "grad_norm": 0.008313027210533619,
+      "learning_rate": 3.604527579976618e-05,
+      "loss": 0.0005,
+      "step": 3675
+    },
+    {
+      "epoch": 1.0616929698708752,
+      "grad_norm": 0.6244511008262634,
+      "learning_rate": 3.591242427463067e-05,
+      "loss": 0.0308,
+      "step": 3700
+    },
+    {
+      "epoch": 1.0688665710186513,
+      "grad_norm": 0.004019048996269703,
+      "learning_rate": 3.577957274949517e-05,
+      "loss": 0.03,
+      "step": 3725
+    },
+    {
+      "epoch": 1.0760401721664274,
+      "grad_norm": 0.0038138478994369507,
+      "learning_rate": 3.564672122435966e-05,
+      "loss": 0.0004,
+      "step": 3750
+    },
+    {
+      "epoch": 1.0832137733142038,
+      "grad_norm": 0.005525535438209772,
+      "learning_rate": 3.5513869699224154e-05,
+      "loss": 0.0003,
+      "step": 3775
+    },
+    {
+      "epoch": 1.0903873744619799,
+      "grad_norm": 0.004180921241641045,
+      "learning_rate": 3.5381018174088643e-05,
+      "loss": 0.0003,
+      "step": 3800
+    },
+    {
+      "epoch": 1.0975609756097562,
+      "grad_norm": 0.004629930946975946,
+      "learning_rate": 3.5248166648953126e-05,
+      "loss": 0.1079,
+      "step": 3825
+    },
+    {
+      "epoch": 1.1047345767575323,
+      "grad_norm": 0.008479510433971882,
+      "learning_rate": 3.511531512381762e-05,
+      "loss": 0.0788,
+      "step": 3850
+    },
+    {
+      "epoch": 1.1119081779053084,
+      "grad_norm": 0.007632472552359104,
+      "learning_rate": 3.498246359868211e-05,
+      "loss": 0.0008,
+      "step": 3875
+    },
+    {
+      "epoch": 1.1190817790530847,
+      "grad_norm": 0.009593753144145012,
+      "learning_rate": 3.484961207354661e-05,
+      "loss": 0.0006,
+      "step": 3900
+    },
+    {
+      "epoch": 1.1262553802008608,
+      "grad_norm": 0.00635389843955636,
+      "learning_rate": 3.47167605484111e-05,
+      "loss": 0.0659,
+      "step": 3925
+    },
+    {
+      "epoch": 1.133428981348637,
+      "grad_norm": 0.005174864083528519,
+      "learning_rate": 3.458390902327559e-05,
+      "loss": 0.0007,
+      "step": 3950
+    },
+    {
+      "epoch": 1.1406025824964132,
+      "grad_norm": 0.0196967925876379,
+      "learning_rate": 3.4451057498140085e-05,
+      "loss": 0.028,
+      "step": 3975
+    },
+    {
+      "epoch": 1.1477761836441893,
+      "grad_norm": 0.0053730374202132225,
+      "learning_rate": 3.431820597300457e-05,
+      "loss": 0.0044,
+      "step": 4000
+    },
+    {
+      "epoch": 1.1549497847919656,
+      "grad_norm": 0.016190949827432632,
+      "learning_rate": 3.4185354447869064e-05,
+      "loss": 0.0034,
+      "step": 4025
+    },
+    {
+      "epoch": 1.1621233859397417,
+      "grad_norm": 0.06172305718064308,
+      "learning_rate": 3.4052502922733554e-05,
+      "loss": 0.045,
+      "step": 4050
+    },
+    {
+      "epoch": 1.169296987087518,
+      "grad_norm": 0.005435667000710964,
+      "learning_rate": 3.3919651397598044e-05,
+      "loss": 0.0006,
+      "step": 4075
+    },
+    {
+      "epoch": 1.1764705882352942,
+      "grad_norm": 0.0059057194739580154,
+      "learning_rate": 3.378679987246254e-05,
+      "loss": 0.0006,
+      "step": 4100
+    },
+    {
+      "epoch": 1.1836441893830703,
+      "grad_norm": 0.003536668373271823,
+      "learning_rate": 3.365394834732703e-05,
+      "loss": 0.0002,
+      "step": 4125
+    },
+    {
+      "epoch": 1.1908177905308466,
+      "grad_norm": 0.013157457113265991,
+      "learning_rate": 3.352109682219152e-05,
+      "loss": 0.0712,
+      "step": 4150
+    },
+    {
+      "epoch": 1.1979913916786227,
+      "grad_norm": 0.05286416783928871,
+      "learning_rate": 3.3388245297056016e-05,
+      "loss": 0.0032,
+      "step": 4175
+    },
+    {
+      "epoch": 1.2051649928263988,
+      "grad_norm": 0.007331141736358404,
+      "learning_rate": 3.32553937719205e-05,
+      "loss": 0.1212,
+      "step": 4200
+    },
+    {
+      "epoch": 1.212338593974175,
+      "grad_norm": 0.01495648454874754,
+      "learning_rate": 3.3122542246784996e-05,
+      "loss": 0.0026,
+      "step": 4225
+    },
+    {
+      "epoch": 1.2195121951219512,
+      "grad_norm": 0.014520620927214622,
+      "learning_rate": 3.2989690721649485e-05,
+      "loss": 0.011,
+      "step": 4250
+    },
+    {
+      "epoch": 1.2266857962697273,
+      "grad_norm": 0.0068002501502633095,
+      "learning_rate": 3.2856839196513975e-05,
+      "loss": 0.0007,
+      "step": 4275
+    },
+    {
+      "epoch": 1.2338593974175036,
+      "grad_norm": 0.004121303092688322,
+      "learning_rate": 3.272398767137847e-05,
+      "loss": 0.0313,
+      "step": 4300
+    },
+    {
+      "epoch": 1.2410329985652797,
+      "grad_norm": 0.005836965050548315,
+      "learning_rate": 3.259113614624296e-05,
+      "loss": 0.0105,
+      "step": 4325
+    },
+    {
+      "epoch": 1.248206599713056,
+      "grad_norm": 0.004592243582010269,
+      "learning_rate": 3.245828462110745e-05,
+      "loss": 0.0002,
+      "step": 4350
+    },
+    {
+      "epoch": 1.2553802008608321,
+      "grad_norm": 0.01724414713680744,
+      "learning_rate": 3.2330747156977364e-05,
+      "loss": 0.1373,
+      "step": 4375
+    },
+    {
+      "epoch": 1.2625538020086085,
+      "grad_norm": 0.011967150494456291,
+      "learning_rate": 3.2197895631841854e-05,
+      "loss": 0.0277,
+      "step": 4400
+    },
+    {
+      "epoch": 1.2697274031563845,
+      "grad_norm": 0.689711332321167,
+      "learning_rate": 3.206504410670635e-05,
+      "loss": 0.0309,
+      "step": 4425
+    },
+    {
+      "epoch": 1.2769010043041606,
+      "grad_norm": 0.003829318331554532,
+      "learning_rate": 3.193219258157083e-05,
+      "loss": 0.0005,
+      "step": 4450
+    },
+    {
+      "epoch": 1.284074605451937,
+      "grad_norm": 0.005293109454214573,
+      "learning_rate": 3.179934105643533e-05,
+      "loss": 0.0449,
+      "step": 4475
+    },
+    {
+      "epoch": 1.291248206599713,
+      "grad_norm": 0.005219063721597195,
+      "learning_rate": 3.166648953129982e-05,
+      "loss": 0.0398,
+      "step": 4500
+    },
+    {
+      "epoch": 1.2984218077474892,
+      "grad_norm": 0.00711538502946496,
+      "learning_rate": 3.153363800616431e-05,
+      "loss": 0.0267,
+      "step": 4525
+    },
+    {
+      "epoch": 1.3055954088952655,
+      "grad_norm": 0.005905709229409695,
+      "learning_rate": 3.1400786481028806e-05,
+      "loss": 0.0577,
+      "step": 4550
+    },
+    {
+      "epoch": 1.3127690100430416,
+      "grad_norm": 0.0065200235694646835,
+      "learning_rate": 3.1267934955893295e-05,
+      "loss": 0.0092,
+      "step": 4575
+    },
+    {
+      "epoch": 1.3199426111908177,
+      "grad_norm": 0.007951737381517887,
+      "learning_rate": 3.113508343075779e-05,
+      "loss": 0.0103,
+      "step": 4600
+    },
+    {
+      "epoch": 1.327116212338594,
+      "grad_norm": 0.004364294931292534,
+      "learning_rate": 3.1002231905622275e-05,
+      "loss": 0.0126,
+      "step": 4625
+    },
+    {
+      "epoch": 1.33428981348637,
+      "grad_norm": 0.004744912032037973,
+      "learning_rate": 3.0869380380486764e-05,
+      "loss": 0.0301,
+      "step": 4650
+    },
+    {
+      "epoch": 1.3414634146341464,
+      "grad_norm": 0.006403733976185322,
+      "learning_rate": 3.073652885535126e-05,
+      "loss": 0.0347,
+      "step": 4675
+    },
+    {
+      "epoch": 1.3486370157819225,
+      "grad_norm": 0.004806953482329845,
+      "learning_rate": 3.060367733021575e-05,
+      "loss": 0.0629,
+      "step": 4700
+    },
+    {
+      "epoch": 1.3558106169296988,
+      "grad_norm": 2.9653139114379883,
+      "learning_rate": 3.0470825805080244e-05,
+      "loss": 0.0087,
+      "step": 4725
+    },
+    {
+      "epoch": 1.362984218077475,
+      "grad_norm": 0.0028481949120759964,
+      "learning_rate": 3.0337974279944737e-05,
+      "loss": 0.043,
+      "step": 4750
+    },
+    {
+      "epoch": 1.370157819225251,
+      "grad_norm": 0.005747169256210327,
+      "learning_rate": 3.020512275480923e-05,
+      "loss": 0.0009,
+      "step": 4775
+    },
+    {
+      "epoch": 1.3773314203730274,
+      "grad_norm": 2.9883158206939697,
+      "learning_rate": 3.007227122967372e-05,
+      "loss": 0.0257,
+      "step": 4800
+    },
+    {
+      "epoch": 1.3845050215208035,
+      "grad_norm": 0.009053130634129047,
+      "learning_rate": 2.9939419704538206e-05,
+      "loss": 0.0533,
+      "step": 4825
+    },
+    {
+      "epoch": 1.3916786226685796,
+      "grad_norm": 0.011015841737389565,
+      "learning_rate": 2.98065681794027e-05,
+      "loss": 0.0388,
+      "step": 4850
+    },
+    {
+      "epoch": 1.3988522238163559,
+      "grad_norm": 0.007833955809473991,
+      "learning_rate": 2.9673716654267192e-05,
+      "loss": 0.001,
+      "step": 4875
+    },
+    {
+      "epoch": 1.406025824964132,
+      "grad_norm": 0.0066580744460225105,
+      "learning_rate": 2.9540865129131685e-05,
+      "loss": 0.0008,
+      "step": 4900
+    },
+    {
+      "epoch": 1.413199426111908,
+      "grad_norm": 0.004744118079543114,
+      "learning_rate": 2.9408013603996175e-05,
+      "loss": 0.0361,
+      "step": 4925
+    },
+    {
+      "epoch": 1.4203730272596844,
+      "grad_norm": 0.017294887453317642,
+      "learning_rate": 2.9275162078860668e-05,
+      "loss": 0.0003,
+      "step": 4950
+    },
+    {
+      "epoch": 1.4275466284074605,
+      "grad_norm": 0.019565369933843613,
+      "learning_rate": 2.914231055372516e-05,
+      "loss": 0.0066,
+      "step": 4975
+    },
+    {
+      "epoch": 1.4347202295552366,
+      "grad_norm": 0.005781451240181923,
+      "learning_rate": 2.9009459028589647e-05,
+      "loss": 0.0807,
+      "step": 5000
+    },
+    {
+      "epoch": 1.441893830703013,
+      "grad_norm": 0.018371548503637314,
+      "learning_rate": 2.887660750345414e-05,
+      "loss": 0.0383,
+      "step": 5025
+    },
+    {
+      "epoch": 1.4490674318507892,
+      "grad_norm": 0.019642187282443047,
+      "learning_rate": 2.874375597831863e-05,
+      "loss": 0.0006,
+      "step": 5050
+    },
+    {
+      "epoch": 1.4562410329985653,
+      "grad_norm": 0.016255564987659454,
+      "learning_rate": 2.8610904453183123e-05,
+      "loss": 0.0004,
+      "step": 5075
+    },
+    {
+      "epoch": 1.4634146341463414,
+      "grad_norm": 6.259925365447998,
+      "learning_rate": 2.8478052928047616e-05,
+      "loss": 0.1058,
+      "step": 5100
+    },
+    {
+      "epoch": 1.4705882352941178,
+      "grad_norm": 0.028038620948791504,
+      "learning_rate": 2.834520140291211e-05,
+      "loss": 0.0848,
+      "step": 5125
+    },
+    {
+      "epoch": 1.4777618364418939,
+      "grad_norm": 18.35304832458496,
+      "learning_rate": 2.82123498777766e-05,
+      "loss": 0.0546,
+      "step": 5150
+    },
+    {
+      "epoch": 1.48493543758967,
+      "grad_norm": 0.005022502038627863,
+      "learning_rate": 2.8079498352641086e-05,
+      "loss": 0.0265,
+      "step": 5175
+    },
+    {
+      "epoch": 1.4921090387374463,
+      "grad_norm": 0.011426527984440327,
+      "learning_rate": 2.794664682750558e-05,
+      "loss": 0.017,
+      "step": 5200
+    },
+    {
+      "epoch": 1.4992826398852224,
+      "grad_norm": 0.02600315399467945,
+      "learning_rate": 2.7813795302370072e-05,
+      "loss": 0.001,
+      "step": 5225
+    },
+    {
+      "epoch": 1.5064562410329985,
+      "grad_norm": 0.0031450982205569744,
+      "learning_rate": 2.7680943777234565e-05,
+      "loss": 0.0296,
+      "step": 5250
+    },
+    {
+      "epoch": 1.5136298421807748,
+      "grad_norm": 0.00543051864951849,
+      "learning_rate": 2.7548092252099055e-05,
+      "loss": 0.0004,
+      "step": 5275
+    },
+    {
+      "epoch": 1.5208034433285509,
+      "grad_norm": 0.007613678928464651,
+      "learning_rate": 2.7415240726963548e-05,
+      "loss": 0.0003,
+      "step": 5300
+    },
+    {
+      "epoch": 1.527977044476327,
+      "grad_norm": 0.00250364001840353,
+      "learning_rate": 2.728238920182804e-05,
+      "loss": 0.0217,
+      "step": 5325
+    },
+    {
+      "epoch": 1.5351506456241033,
+      "grad_norm": 0.0024825434666126966,
+      "learning_rate": 2.7149537676692534e-05,
+      "loss": 0.0442,
+      "step": 5350
+    },
+    {
+      "epoch": 1.5423242467718796,
+      "grad_norm": 0.00660035852342844,
+      "learning_rate": 2.701668615155702e-05,
+      "loss": 0.0002,
+      "step": 5375
+    },
+    {
+      "epoch": 1.5494978479196555,
+      "grad_norm": 0.0030255629681050777,
+      "learning_rate": 2.688383462642151e-05,
+      "loss": 0.001,
+      "step": 5400
+    },
+    {
+      "epoch": 1.5566714490674318,
+      "grad_norm": 56.207244873046875,
+      "learning_rate": 2.6750983101286003e-05,
+      "loss": 0.0662,
+      "step": 5425
+    },
+    {
+      "epoch": 1.5638450502152081,
+      "grad_norm": 0.005194812081754208,
+      "learning_rate": 2.6618131576150496e-05,
+      "loss": 0.0004,
+      "step": 5450
+    },
+    {
+      "epoch": 1.5710186513629842,
+      "grad_norm": 0.018478918820619583,
+      "learning_rate": 2.648528005101499e-05,
+      "loss": 0.0786,
+      "step": 5475
+    },
+    {
+      "epoch": 1.5781922525107603,
+      "grad_norm": 67.21288299560547,
+      "learning_rate": 2.635242852587948e-05,
+      "loss": 0.0224,
+      "step": 5500
+    },
+    {
+      "epoch": 1.5853658536585367,
+      "grad_norm": 0.005518095102161169,
+      "learning_rate": 2.6219577000743972e-05,
+      "loss": 0.0005,
+      "step": 5525
+    },
+    {
+      "epoch": 1.5925394548063128,
+      "grad_norm": 0.013573232106864452,
+      "learning_rate": 2.6086725475608458e-05,
+      "loss": 0.0703,
+      "step": 5550
+    },
+    {
+      "epoch": 1.5997130559540889,
+      "grad_norm": 0.022108446806669235,
+      "learning_rate": 2.595387395047295e-05,
+      "loss": 0.0127,
+      "step": 5575
+    },
+    {
+      "epoch": 1.6068866571018652,
+      "grad_norm": 0.02520466223359108,
+      "learning_rate": 2.5821022425337444e-05,
+      "loss": 0.0908,
+      "step": 5600
+    },
+    {
+      "epoch": 1.6140602582496413,
+      "grad_norm": 0.06917204707860947,
+      "learning_rate": 2.5688170900201934e-05,
+      "loss": 0.026,
+      "step": 5625
+    },
+    {
+      "epoch": 1.6212338593974174,
+      "grad_norm": 0.011066574603319168,
+      "learning_rate": 2.5555319375066427e-05,
+      "loss": 0.021,
+      "step": 5650
+    },
+    {
+      "epoch": 1.6284074605451937,
+      "grad_norm": 0.004337651655077934,
+      "learning_rate": 2.542246784993092e-05,
+      "loss": 0.0004,
+      "step": 5675
+    },
+    {
+      "epoch": 1.63558106169297,
+      "grad_norm": 0.007177389692515135,
+      "learning_rate": 2.5289616324795413e-05,
+      "loss": 0.0432,
+      "step": 5700
+    },
+    {
+      "epoch": 1.642754662840746,
+      "grad_norm": 0.004365015309303999,
+      "learning_rate": 2.51567647996599e-05,
+      "loss": 0.0003,
+      "step": 5725
+    },
+    {
+      "epoch": 1.6499282639885222,
+      "grad_norm": 0.005093116778880358,
+      "learning_rate": 2.502391327452439e-05,
+      "loss": 0.0006,
+      "step": 5750
+    },
+    {
+      "epoch": 1.6571018651362985,
+      "grad_norm": 0.00538448104634881,
+      "learning_rate": 2.4891061749388883e-05,
+      "loss": 0.0244,
+      "step": 5775
+    },
+    {
+      "epoch": 1.6642754662840746,
+      "grad_norm": 0.0028270191978663206,
+      "learning_rate": 2.4758210224253376e-05,
+      "loss": 0.0003,
+      "step": 5800
+    },
+    {
+      "epoch": 1.6714490674318507,
+      "grad_norm": 0.004735349677503109,
+      "learning_rate": 2.462535869911787e-05,
+      "loss": 0.0006,
+      "step": 5825
+    },
+    {
+      "epoch": 1.678622668579627,
+      "grad_norm": 0.002434446709230542,
+      "learning_rate": 2.449250717398236e-05,
+      "loss": 0.0348,
+      "step": 5850
+    },
+    {
+      "epoch": 1.6857962697274032,
+      "grad_norm": 9.833294868469238,
+      "learning_rate": 2.4359655648846848e-05,
+      "loss": 0.0005,
+      "step": 5875
+    },
+    {
+      "epoch": 1.6929698708751793,
+      "grad_norm": 0.002602140884846449,
+      "learning_rate": 2.422680412371134e-05,
+      "loss": 0.0311,
+      "step": 5900
+    },
+    {
+      "epoch": 1.7001434720229556,
+      "grad_norm": 0.006632608827203512,
+      "learning_rate": 2.4093952598575834e-05,
+      "loss": 0.0883,
+      "step": 5925
+    },
+    {
+      "epoch": 1.7073170731707317,
+      "grad_norm": 0.009323637932538986,
+      "learning_rate": 2.3961101073440324e-05,
+      "loss": 0.0409,
+      "step": 5950
+    },
+    {
+      "epoch": 1.7144906743185078,
+      "grad_norm": 0.012521679513156414,
+      "learning_rate": 2.3828249548304814e-05,
+      "loss": 0.0282,
+      "step": 5975
+    },
+    {
+      "epoch": 1.721664275466284,
+      "grad_norm": 0.008466576226055622,
+      "learning_rate": 2.3695398023169307e-05,
+      "loss": 0.0244,
+      "step": 6000
+    },
+    {
+      "epoch": 1.7288378766140604,
+      "grad_norm": 0.010361541993916035,
+      "learning_rate": 2.35625464980338e-05,
+      "loss": 0.0356,
+      "step": 6025
+    },
+    {
+      "epoch": 1.7360114777618363,
+      "grad_norm": 0.012751937843859196,
+      "learning_rate": 2.342969497289829e-05,
+      "loss": 0.0847,
+      "step": 6050
+    },
+    {
+      "epoch": 1.7431850789096126,
+      "grad_norm": 0.03529978543519974,
+      "learning_rate": 2.3296843447762783e-05,
+      "loss": 0.0384,
+      "step": 6075
+    },
+    {
+      "epoch": 1.750358680057389,
+      "grad_norm": 0.026526516303420067,
+      "learning_rate": 2.3163991922627273e-05,
+      "loss": 0.0334,
+      "step": 6100
+    },
+    {
+      "epoch": 1.757532281205165,
+      "grad_norm": 0.008869277313351631,
+      "learning_rate": 2.3031140397491766e-05,
+      "loss": 0.0092,
+      "step": 6125
+    },
+    {
+      "epoch": 1.7647058823529411,
+      "grad_norm": 21.071659088134766,
+      "learning_rate": 2.2898288872356255e-05,
+      "loss": 0.049,
+      "step": 6150
+    },
+    {
+      "epoch": 1.7718794835007174,
+      "grad_norm": 0.00842801108956337,
+      "learning_rate": 2.276543734722075e-05,
+      "loss": 0.0406,
+      "step": 6175
+    },
+    {
+      "epoch": 1.7790530846484935,
+      "grad_norm": 0.009631357155740261,
+      "learning_rate": 2.2632585822085238e-05,
+      "loss": 0.0033,
+      "step": 6200
+    },
+    {
+      "epoch": 1.7862266857962696,
+      "grad_norm": 0.015189352445304394,
+      "learning_rate": 2.2499734296949728e-05,
+      "loss": 0.0981,
+      "step": 6225
+    },
+    {
+      "epoch": 1.793400286944046,
+      "grad_norm": 0.13944695889949799,
+      "learning_rate": 2.236688277181422e-05,
+      "loss": 0.0003,
+      "step": 6250
+    },
+    {
+      "epoch": 1.800573888091822,
+      "grad_norm": 0.001980824628844857,
+      "learning_rate": 2.2234031246678714e-05,
+      "loss": 0.0004,
+      "step": 6275
+    },
+    {
+      "epoch": 1.8077474892395982,
+      "grad_norm": 0.005285199265927076,
+      "learning_rate": 2.2101179721543204e-05,
+      "loss": 0.0044,
+      "step": 6300
+    },
+    {
+      "epoch": 1.8149210903873745,
+      "grad_norm": 9.718914031982422,
+      "learning_rate": 2.1968328196407693e-05,
+      "loss": 0.0377,
+      "step": 6325
+    },
+    {
+      "epoch": 1.8220946915351508,
+      "grad_norm": 0.0019531676080077887,
+      "learning_rate": 2.1835476671272187e-05,
+      "loss": 0.0093,
+      "step": 6350
+    },
+    {
+      "epoch": 1.8292682926829267,
+      "grad_norm": 0.0016301467549055815,
+      "learning_rate": 2.170262514613668e-05,
+      "loss": 0.0015,
+      "step": 6375
+    },
+    {
+      "epoch": 1.836441893830703,
+      "grad_norm": 44.472381591796875,
+      "learning_rate": 2.157508768200659e-05,
+      "loss": 0.1747,
+      "step": 6400
+    },
+    {
+      "epoch": 1.8436154949784793,
+      "grad_norm": 0.00314929592423141,
+      "learning_rate": 2.1442236156871082e-05,
+      "loss": 0.0216,
+      "step": 6425
+    },
+    {
+      "epoch": 1.8507890961262554,
+      "grad_norm": 0.003403552807867527,
+      "learning_rate": 2.1309384631735572e-05,
+      "loss": 0.0021,
+      "step": 6450
+    },
+    {
+      "epoch": 1.8579626972740315,
+      "grad_norm": 0.007590115536004305,
+      "learning_rate": 2.1176533106600065e-05,
+      "loss": 0.0012,
+      "step": 6475
+    },
+    {
+      "epoch": 1.8651362984218078,
+      "grad_norm": 0.0027949281502515078,
+      "learning_rate": 2.1043681581464555e-05,
+      "loss": 0.1361,
+      "step": 6500
+    },
+    {
+      "epoch": 1.872309899569584,
+      "grad_norm": 0.00557307805866003,
+      "learning_rate": 2.0910830056329048e-05,
+      "loss": 0.0365,
+      "step": 6525
+    },
+    {
+      "epoch": 1.87948350071736,
+      "grad_norm": 0.010457979515194893,
+      "learning_rate": 2.077797853119354e-05,
+      "loss": 0.0358,
+      "step": 6550
+    },
+    {
+      "epoch": 1.8866571018651364,
+      "grad_norm": 0.003813342424109578,
+      "learning_rate": 2.064512700605803e-05,
+      "loss": 0.0321,
+      "step": 6575
+    },
+    {
+      "epoch": 1.8938307030129125,
+      "grad_norm": 0.00262393313460052,
+      "learning_rate": 2.051227548092252e-05,
+      "loss": 0.022,
+      "step": 6600
+    },
+    {
+      "epoch": 1.9010043041606886,
+      "grad_norm": 0.004526357166469097,
+      "learning_rate": 2.0379423955787014e-05,
+      "loss": 0.0424,
+      "step": 6625
+    },
+    {
+      "epoch": 1.9081779053084649,
+      "grad_norm": 0.01698668673634529,
+      "learning_rate": 2.0246572430651507e-05,
+      "loss": 0.0009,
+      "step": 6650
+    },
+    {
+      "epoch": 1.9153515064562412,
+      "grad_norm": 0.0501057431101799,
+      "learning_rate": 2.0113720905515997e-05,
+      "loss": 0.0237,
+      "step": 6675
+    },
+    {
+      "epoch": 1.922525107604017,
+      "grad_norm": 0.007618068717420101,
+      "learning_rate": 1.9980869380380486e-05,
+      "loss": 0.0192,
+      "step": 6700
+    },
+    {
+      "epoch": 1.9296987087517934,
+      "grad_norm": 0.01174473762512207,
+      "learning_rate": 1.984801785524498e-05,
+      "loss": 0.0334,
+      "step": 6725
+    },
+    {
+      "epoch": 1.9368723098995697,
+      "grad_norm": 25.125062942504883,
+      "learning_rate": 1.9715166330109472e-05,
+      "loss": 0.0098,
+      "step": 6750
+    },
+    {
+      "epoch": 1.9440459110473458,
+      "grad_norm": 0.0056104715913534164,
+      "learning_rate": 1.9582314804973962e-05,
+      "loss": 0.1462,
+      "step": 6775
+    },
+    {
+      "epoch": 1.951219512195122,
+      "grad_norm": 0.05587226152420044,
+      "learning_rate": 1.9449463279838452e-05,
+      "loss": 0.081,
+      "step": 6800
+    },
+    {
+      "epoch": 1.9583931133428982,
+      "grad_norm": 0.01742021180689335,
+      "learning_rate": 1.9316611754702945e-05,
+      "loss": 0.0418,
+      "step": 6825
+    },
+    {
+      "epoch": 1.9655667144906743,
+      "grad_norm": 0.45866331458091736,
+      "learning_rate": 1.9183760229567435e-05,
+      "loss": 0.001,
+      "step": 6850
+    },
+    {
+      "epoch": 1.9727403156384504,
+      "grad_norm": 0.04859813675284386,
+      "learning_rate": 1.9050908704431928e-05,
+      "loss": 0.0302,
+      "step": 6875
+    },
+    {
+      "epoch": 1.9799139167862267,
+      "grad_norm": 0.015134917572140694,
+      "learning_rate": 1.891805717929642e-05,
+      "loss": 0.0418,
+      "step": 6900
+    },
+    {
+      "epoch": 1.9870875179340028,
+      "grad_norm": 0.02702825888991356,
+      "learning_rate": 1.878520565416091e-05,
+      "loss": 0.0419,
+      "step": 6925
+    },
+    {
+      "epoch": 1.994261119081779,
+      "grad_norm": 0.023256802931427956,
+      "learning_rate": 1.86523541290254e-05,
+      "loss": 0.0679,
+      "step": 6950
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.9899935442220787,
+      "eval_auc": 0.999704926354536,
+      "eval_f1": 0.9900353584056574,
+      "eval_loss": 0.04012129828333855,
+      "eval_precision": 0.9859154929577465,
+      "eval_recall": 0.9941897998708844,
+      "eval_runtime": 4.2712,
+      "eval_samples_per_second": 725.331,
+      "eval_steps_per_second": 45.421,
+      "step": 6970
+    }
+  ],
+  "logging_steps": 25,
+  "max_steps": 10455,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 5,
+        "early_stopping_threshold": 0.01
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 1
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 462331386716160.0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-6970/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc076067c3e486e2d8f21770bca521a80d83b3dd7aa04905e6351e987c45120c
+size 5368

config.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "_name_or_path": "TaylorAI/gte-tiny",
+  "_num_labels": 2,
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 384,
+  "id2label": {
+    "0": "human",
+    "1": "llm"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 1536,
+  "label2id": {
+    "human": 0,
+    "llm": 1
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 6,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e1dc3603f7927d59bbb28381542e7c65f0c7d40444c17d18e2bdefc35a0d77c0
+size 90867952

runs/May30_00-09-04_r-trentmkelly-autotrain-advanced-9f8hpchj-c1d5e-s6v1w/events.out.tfevents.1748563746.r-trentmkelly-autotrain-advanced-9f8hpchj-c1d5e-s6v1w.75.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:026fbd8aa36c0db2cf89e496f4291903eea3a947dbffe30b3535fea8b3b6ece7
-size 5187

 version https://git-lfs.github.com/spec/v1
+oid sha256:9ff7b0a124a2d68f7bff301a035bc548c9cfe8a0ce636fb1b5ca61415afcb921
+size 95276

runs/May30_00-09-04_r-trentmkelly-autotrain-advanced-9f8hpchj-c1d5e-s6v1w/events.out.tfevents.1748564133.r-trentmkelly-autotrain-advanced-9f8hpchj-c1d5e-s6v1w.75.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dd156ae9be79077801d670663261bd82c8f34622e6471e5d2c579df41bb32179
+size 607

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "additional_special_tokens": [
+    "[PAD]",
+    "[UNK]",
+    "[CLS]",
+    "[SEP]",
+    "[MASK]"
+  ],
+  "cls_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "[MASK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,72 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [
+    "[PAD]",
+    "[UNK]",
+    "[CLS]",
+    "[SEP]",
+    "[MASK]"
+  ],
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "max_length": 128,
+  "model_max_length": 512,
+  "never_split": null,
+  "pad_to_multiple_of": null,
+  "pad_token": "[PAD]",
+  "pad_token_type_id": 0,
+  "padding_side": "right",
+  "sep_token": "[SEP]",
+  "stride": 0,
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
+  "unk_token": "[UNK]"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc076067c3e486e2d8f21770bca521a80d83b3dd7aa04905e6351e987c45120c
+size 5368

training_params.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+    "data_path": "slop-detector-mini/autotrain-data",
+    "model": "TaylorAI/gte-tiny",
+    "lr": 5e-05,
+    "epochs": 3,
+    "max_seq_length": 128,
+    "batch_size": 8,
+    "warmup_ratio": 0.1,
+    "gradient_accumulation": 1,
+    "optimizer": "adamw_torch",
+    "scheduler": "linear",
+    "weight_decay": 0.0,
+    "max_grad_norm": 1.0,
+    "seed": 42,
+    "train_split": "train",
+    "valid_split": "validation",
+    "text_column": "autotrain_text",
+    "target_column": "autotrain_label",
+    "logging_steps": -1,
+    "project_name": "slop-detector-mini",
+    "auto_find_batch_size": false,
+    "mixed_precision": "fp16",
+    "save_total_limit": 1,
+    "push_to_hub": true,
+    "eval_strategy": "epoch",
+    "username": "trentmkelly",
+    "log": "tensorboard",
+    "early_stopping_patience": 5,
+    "early_stopping_threshold": 0.01
+}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff