FINE-TUNED WITH MERGED DATASET

Browse files

Files changed (5) hide show

README.md +14 -0
all_results.json +8 -0
runs/Mar03_09-41-24_a2727a3c73a1/events.out.tfevents.1709463658.a2727a3c73a1.593.1 +3 -0
train_results.json +8 -0
trainer_state.json +450 -0

README.md CHANGED Viewed

@@ -3,6 +3,8 @@ license: apache-2.0
 base_model: distilbert-base-uncased
 tags:
 - generated_from_trainer
 model-index:
 - name: finetuning-fake-reviews-detector-model
   results: []
@@ -14,6 +16,18 @@ should probably proofread and complete it, then remove this comment. -->
 # finetuning-fake-reviews-detector-model
 This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on the None dataset.
 ## Model description

 base_model: distilbert-base-uncased
 tags:
 - generated_from_trainer
+metrics:
+- accuracy
 model-index:
 - name: finetuning-fake-reviews-detector-model
   results: []
 # finetuning-fake-reviews-detector-model
 This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on the None dataset.
+It achieves the following results on the evaluation set:
+- Loss: 0.4370
+- Accuracy: 0.8844
+- Weighted f1: 0.8821
+- Micro f1: 0.8844
+- Macro f1: 0.8151
+- Weighted recall: 0.8844
+- Micro recall: 0.8844
+- Macro recall: 0.8032
+- Weighted precision: 0.8808
+- Micro precision: 0.8844
+- Macro precision: 0.8293
 ## Model description

all_results.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "epoch": 5.0,
+    "total_flos": 1.2565894692964032e+16,
+    "train_loss": 0.27979692445330456,
+    "train_runtime": 4649.1669,
+    "train_samples_per_second": 104.814,
+    "train_steps_per_second": 6.552
+}

runs/Mar03_09-41-24_a2727a3c73a1/events.out.tfevents.1709463658.a2727a3c73a1.593.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91ba59ddae8b0dcd15a5f5a2da464b49febd38a122734d9bd59981a60499c509
+size 936

train_results.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "epoch": 5.0,
+    "total_flos": 1.2565894692964032e+16,
+    "train_loss": 0.27979692445330456,
+    "train_runtime": 4649.1669,
+    "train_samples_per_second": 104.814,
+    "train_steps_per_second": 6.552
+}

trainer_state.json ADDED Viewed

	@@ -0,0 +1,450 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 30460,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.08,
+      "grad_norm": 2.0977869033813477,
+      "learning_rate": 1.967170059093894e-05,
+      "loss": 0.4445,
+      "step": 500
+    },
+    {
+      "epoch": 0.16,
+      "grad_norm": 4.845855236053467,
+      "learning_rate": 1.9343401181877874e-05,
+      "loss": 0.4078,
+      "step": 1000
+    },
+    {
+      "epoch": 0.25,
+      "grad_norm": 2.6214709281921387,
+      "learning_rate": 1.901510177281681e-05,
+      "loss": 0.3889,
+      "step": 1500
+    },
+    {
+      "epoch": 0.33,
+      "grad_norm": 1.9115525484085083,
+      "learning_rate": 1.868680236375575e-05,
+      "loss": 0.378,
+      "step": 2000
+    },
+    {
+      "epoch": 0.41,
+      "grad_norm": 1.6511852741241455,
+      "learning_rate": 1.8358502954694683e-05,
+      "loss": 0.3864,
+      "step": 2500
+    },
+    {
+      "epoch": 0.49,
+      "grad_norm": 2.835732936859131,
+      "learning_rate": 1.803020354563362e-05,
+      "loss": 0.3795,
+      "step": 3000
+    },
+    {
+      "epoch": 0.57,
+      "grad_norm": 2.6627590656280518,
+      "learning_rate": 1.7701904136572555e-05,
+      "loss": 0.3709,
+      "step": 3500
+    },
+    {
+      "epoch": 0.66,
+      "grad_norm": 2.168017864227295,
+      "learning_rate": 1.7373604727511493e-05,
+      "loss": 0.3606,
+      "step": 4000
+    },
+    {
+      "epoch": 0.74,
+      "grad_norm": 1.1796438694000244,
+      "learning_rate": 1.704530531845043e-05,
+      "loss": 0.375,
+      "step": 4500
+    },
+    {
+      "epoch": 0.82,
+      "grad_norm": 1.51750910282135,
+      "learning_rate": 1.6717005909389364e-05,
+      "loss": 0.3616,
+      "step": 5000
+    },
+    {
+      "epoch": 0.9,
+      "grad_norm": 0.9447911381721497,
+      "learning_rate": 1.63887065003283e-05,
+      "loss": 0.3585,
+      "step": 5500
+    },
+    {
+      "epoch": 0.98,
+      "grad_norm": 3.0596373081207275,
+      "learning_rate": 1.6060407091267236e-05,
+      "loss": 0.3501,
+      "step": 6000
+    },
+    {
+      "epoch": 1.07,
+      "grad_norm": 5.587700843811035,
+      "learning_rate": 1.5732107682206174e-05,
+      "loss": 0.3357,
+      "step": 6500
+    },
+    {
+      "epoch": 1.15,
+      "grad_norm": 2.992246389389038,
+      "learning_rate": 1.5403808273145108e-05,
+      "loss": 0.3269,
+      "step": 7000
+    },
+    {
+      "epoch": 1.23,
+      "grad_norm": 0.933838963508606,
+      "learning_rate": 1.5075508864084046e-05,
+      "loss": 0.3241,
+      "step": 7500
+    },
+    {
+      "epoch": 1.31,
+      "grad_norm": 6.16735315322876,
+      "learning_rate": 1.4747209455022982e-05,
+      "loss": 0.3255,
+      "step": 8000
+    },
+    {
+      "epoch": 1.4,
+      "grad_norm": 6.236515522003174,
+      "learning_rate": 1.4418910045961918e-05,
+      "loss": 0.3412,
+      "step": 8500
+    },
+    {
+      "epoch": 1.48,
+      "grad_norm": 2.5656967163085938,
+      "learning_rate": 1.4090610636900854e-05,
+      "loss": 0.3349,
+      "step": 9000
+    },
+    {
+      "epoch": 1.56,
+      "grad_norm": 1.8035532236099243,
+      "learning_rate": 1.3762311227839791e-05,
+      "loss": 0.3133,
+      "step": 9500
+    },
+    {
+      "epoch": 1.64,
+      "grad_norm": 8.10788631439209,
+      "learning_rate": 1.3434011818778727e-05,
+      "loss": 0.3275,
+      "step": 10000
+    },
+    {
+      "epoch": 1.72,
+      "grad_norm": 2.249290943145752,
+      "learning_rate": 1.3105712409717663e-05,
+      "loss": 0.3144,
+      "step": 10500
+    },
+    {
+      "epoch": 1.81,
+      "grad_norm": 3.0741331577301025,
+      "learning_rate": 1.27774130006566e-05,
+      "loss": 0.3198,
+      "step": 11000
+    },
+    {
+      "epoch": 1.89,
+      "grad_norm": 3.473233699798584,
+      "learning_rate": 1.2449113591595537e-05,
+      "loss": 0.31,
+      "step": 11500
+    },
+    {
+      "epoch": 1.97,
+      "grad_norm": 3.777818441390991,
+      "learning_rate": 1.2120814182534473e-05,
+      "loss": 0.3272,
+      "step": 12000
+    },
+    {
+      "epoch": 2.05,
+      "grad_norm": 3.420518636703491,
+      "learning_rate": 1.1792514773473409e-05,
+      "loss": 0.2844,
+      "step": 12500
+    },
+    {
+      "epoch": 2.13,
+      "grad_norm": 0.9904893040657043,
+      "learning_rate": 1.1464215364412346e-05,
+      "loss": 0.285,
+      "step": 13000
+    },
+    {
+      "epoch": 2.22,
+      "grad_norm": 1.798154592514038,
+      "learning_rate": 1.1135915955351282e-05,
+      "loss": 0.269,
+      "step": 13500
+    },
+    {
+      "epoch": 2.3,
+      "grad_norm": 8.202375411987305,
+      "learning_rate": 1.0807616546290218e-05,
+      "loss": 0.2851,
+      "step": 14000
+    },
+    {
+      "epoch": 2.38,
+      "grad_norm": 6.387328147888184,
+      "learning_rate": 1.0479317137229154e-05,
+      "loss": 0.2713,
+      "step": 14500
+    },
+    {
+      "epoch": 2.46,
+      "grad_norm": 9.065672874450684,
+      "learning_rate": 1.0151017728168092e-05,
+      "loss": 0.2685,
+      "step": 15000
+    },
+    {
+      "epoch": 2.54,
+      "grad_norm": 1.2352772951126099,
+      "learning_rate": 9.822718319107026e-06,
+      "loss": 0.2857,
+      "step": 15500
+    },
+    {
+      "epoch": 2.63,
+      "grad_norm": 8.483463287353516,
+      "learning_rate": 9.494418910045962e-06,
+      "loss": 0.2722,
+      "step": 16000
+    },
+    {
+      "epoch": 2.71,
+      "grad_norm": 4.678401947021484,
+      "learning_rate": 9.1661195009849e-06,
+      "loss": 0.2654,
+      "step": 16500
+    },
+    {
+      "epoch": 2.79,
+      "grad_norm": 6.603830814361572,
+      "learning_rate": 8.837820091923836e-06,
+      "loss": 0.2748,
+      "step": 17000
+    },
+    {
+      "epoch": 2.87,
+      "grad_norm": 8.765490531921387,
+      "learning_rate": 8.509520682862772e-06,
+      "loss": 0.2742,
+      "step": 17500
+    },
+    {
+      "epoch": 2.95,
+      "grad_norm": 0.8734021782875061,
+      "learning_rate": 8.181221273801707e-06,
+      "loss": 0.2897,
+      "step": 18000
+    },
+    {
+      "epoch": 3.04,
+      "grad_norm": 6.885056018829346,
+      "learning_rate": 7.852921864740645e-06,
+      "loss": 0.2477,
+      "step": 18500
+    },
+    {
+      "epoch": 3.12,
+      "grad_norm": 19.46624755859375,
+      "learning_rate": 7.52462245567958e-06,
+      "loss": 0.2134,
+      "step": 19000
+    },
+    {
+      "epoch": 3.2,
+      "grad_norm": 3.132298231124878,
+      "learning_rate": 7.196323046618516e-06,
+      "loss": 0.2377,
+      "step": 19500
+    },
+    {
+      "epoch": 3.28,
+      "grad_norm": 3.616292715072632,
+      "learning_rate": 6.868023637557453e-06,
+      "loss": 0.2314,
+      "step": 20000
+    },
+    {
+      "epoch": 3.37,
+      "grad_norm": 36.205810546875,
+      "learning_rate": 6.539724228496389e-06,
+      "loss": 0.2253,
+      "step": 20500
+    },
+    {
+      "epoch": 3.45,
+      "grad_norm": 5.153477191925049,
+      "learning_rate": 6.211424819435326e-06,
+      "loss": 0.2289,
+      "step": 21000
+    },
+    {
+      "epoch": 3.53,
+      "grad_norm": 5.419785499572754,
+      "learning_rate": 5.883125410374262e-06,
+      "loss": 0.216,
+      "step": 21500
+    },
+    {
+      "epoch": 3.61,
+      "grad_norm": 1.2598270177841187,
+      "learning_rate": 5.554826001313198e-06,
+      "loss": 0.2354,
+      "step": 22000
+    },
+    {
+      "epoch": 3.69,
+      "grad_norm": 3.154592752456665,
+      "learning_rate": 5.226526592252134e-06,
+      "loss": 0.226,
+      "step": 22500
+    },
+    {
+      "epoch": 3.78,
+      "grad_norm": 6.700149059295654,
+      "learning_rate": 4.89822718319107e-06,
+      "loss": 0.2322,
+      "step": 23000
+    },
+    {
+      "epoch": 3.86,
+      "grad_norm": 7.298892021179199,
+      "learning_rate": 4.569927774130007e-06,
+      "loss": 0.222,
+      "step": 23500
+    },
+    {
+      "epoch": 3.94,
+      "grad_norm": 3.5850930213928223,
+      "learning_rate": 4.241628365068943e-06,
+      "loss": 0.2348,
+      "step": 24000
+    },
+    {
+      "epoch": 4.02,
+      "grad_norm": 9.055290222167969,
+      "learning_rate": 3.91332895600788e-06,
+      "loss": 0.2222,
+      "step": 24500
+    },
+    {
+      "epoch": 4.1,
+      "grad_norm": 14.489812850952148,
+      "learning_rate": 3.585029546946816e-06,
+      "loss": 0.1874,
+      "step": 25000
+    },
+    {
+      "epoch": 4.19,
+      "grad_norm": 5.70402717590332,
+      "learning_rate": 3.2567301378857517e-06,
+      "loss": 0.2021,
+      "step": 25500
+    },
+    {
+      "epoch": 4.27,
+      "grad_norm": 1.1003680229187012,
+      "learning_rate": 2.928430728824688e-06,
+      "loss": 0.1928,
+      "step": 26000
+    },
+    {
+      "epoch": 4.35,
+      "grad_norm": 20.254186630249023,
+      "learning_rate": 2.6001313197636244e-06,
+      "loss": 0.1994,
+      "step": 26500
+    },
+    {
+      "epoch": 4.43,
+      "grad_norm": 37.06382751464844,
+      "learning_rate": 2.2718319107025612e-06,
+      "loss": 0.1896,
+      "step": 27000
+    },
+    {
+      "epoch": 4.51,
+      "grad_norm": 30.246774673461914,
+      "learning_rate": 1.943532501641497e-06,
+      "loss": 0.1911,
+      "step": 27500
+    },
+    {
+      "epoch": 4.6,
+      "grad_norm": 1.3807177543640137,
+      "learning_rate": 1.6152330925804335e-06,
+      "loss": 0.1982,
+      "step": 28000
+    },
+    {
+      "epoch": 4.68,
+      "grad_norm": 18.111328125,
+      "learning_rate": 1.2869336835193697e-06,
+      "loss": 0.1931,
+      "step": 28500
+    },
+    {
+      "epoch": 4.76,
+      "grad_norm": 30.377147674560547,
+      "learning_rate": 9.58634274458306e-07,
+      "loss": 0.1897,
+      "step": 29000
+    },
+    {
+      "epoch": 4.84,
+      "grad_norm": 7.666069507598877,
+      "learning_rate": 6.303348653972423e-07,
+      "loss": 0.1876,
+      "step": 29500
+    },
+    {
+      "epoch": 4.92,
+      "grad_norm": 15.851324081420898,
+      "learning_rate": 3.020354563361786e-07,
+      "loss": 0.1757,
+      "step": 30000
+    },
+    {
+      "epoch": 5.0,
+      "step": 30460,
+      "total_flos": 1.2565894692964032e+16,
+      "train_loss": 0.27979692445330456,
+      "train_runtime": 4649.1669,
+      "train_samples_per_second": 104.814,
+      "train_steps_per_second": 6.552
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 30460,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 1.2565894692964032e+16,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}