End of training
Browse files- README.md +6 -6
- config.json +58 -81
- emissions.csv +1 -1
- metrics.json +4 -4
- pytorch_model.bin +3 -0
README.md
CHANGED
|
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
|
|
| 16 |
|
| 17 |
This model is a fine-tuned version of [roberta-base](https://huggingface.co/roberta-base) on an unknown dataset.
|
| 18 |
It achieves the following results on the evaluation set:
|
| 19 |
-
- Loss: 0.
|
| 20 |
- F1 Macro: 0.0
|
| 21 |
- Exact Match: 1.0
|
| 22 |
|
|
@@ -49,11 +49,11 @@ The following hyperparameters were used during training:
|
|
| 49 |
|
| 50 |
| Training Loss | Epoch | Step | Validation Loss | F1 Macro | Exact Match |
|
| 51 |
|:-------------:|:-----:|:----:|:---------------:|:--------:|:-----------:|
|
| 52 |
-
| 0.
|
| 53 |
-
| 0.
|
| 54 |
-
| 0.
|
| 55 |
-
| 0.
|
| 56 |
-
| 0.
|
| 57 |
|
| 58 |
|
| 59 |
### Framework versions
|
|
|
|
| 16 |
|
| 17 |
This model is a fine-tuned version of [roberta-base](https://huggingface.co/roberta-base) on an unknown dataset.
|
| 18 |
It achieves the following results on the evaluation set:
|
| 19 |
+
- Loss: 0.0397
|
| 20 |
- F1 Macro: 0.0
|
| 21 |
- Exact Match: 1.0
|
| 22 |
|
|
|
|
| 49 |
|
| 50 |
| Training Loss | Epoch | Step | Validation Loss | F1 Macro | Exact Match |
|
| 51 |
|:-------------:|:-----:|:----:|:---------------:|:--------:|:-----------:|
|
| 52 |
+
| 0.3138 | 1.0 | 25 | 0.0876 | 0.0 | 1.0 |
|
| 53 |
+
| 0.0895 | 2.0 | 50 | 0.0536 | 0.0 | 1.0 |
|
| 54 |
+
| 0.0625 | 3.0 | 75 | 0.0448 | 0.0 | 1.0 |
|
| 55 |
+
| 0.0486 | 4.0 | 100 | 0.0408 | 0.0 | 1.0 |
|
| 56 |
+
| 0.0462 | 5.0 | 125 | 0.0397 | 0.0 | 1.0 |
|
| 57 |
|
| 58 |
|
| 59 |
### Framework versions
|
config.json
CHANGED
|
@@ -1,82 +1,59 @@
|
|
| 1 |
{
|
| 2 |
-
|
| 3 |
-
"
|
| 4 |
-
|
| 5 |
-
|
| 6 |
-
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
|
| 11 |
-
|
| 12 |
-
|
| 13 |
-
|
| 14 |
-
|
| 15 |
-
|
| 16 |
-
|
| 17 |
-
|
| 18 |
-
|
| 19 |
-
|
| 20 |
-
|
| 21 |
-
|
| 22 |
-
|
| 23 |
-
|
| 24 |
-
|
| 25 |
-
|
| 26 |
-
|
| 27 |
-
|
| 28 |
-
|
| 29 |
-
|
| 30 |
-
|
| 31 |
-
"
|
| 32 |
-
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
|
| 36 |
-
|
| 37 |
-
|
| 38 |
-
|
| 39 |
-
|
| 40 |
-
|
| 41 |
-
|
| 42 |
-
|
| 43 |
-
|
| 44 |
-
|
| 45 |
-
|
| 46 |
-
|
| 47 |
-
|
| 48 |
-
|
| 49 |
-
|
| 50 |
-
|
| 51 |
-
|
| 52 |
-
|
| 53 |
-
|
| 54 |
-
|
| 55 |
-
|
| 56 |
-
|
| 57 |
-
|
| 58 |
-
|
| 59 |
-
|
| 60 |
-
"706": 17,
|
| 61 |
-
"707": 18,
|
| 62 |
-
"710": 19,
|
| 63 |
-
"74": 20,
|
| 64 |
-
"754": 21,
|
| 65 |
-
"829": 22,
|
| 66 |
-
"862": 23,
|
| 67 |
-
"913": 24,
|
| 68 |
-
"94": 25
|
| 69 |
-
},
|
| 70 |
-
"layer_norm_eps": 1e-05,
|
| 71 |
-
"max_position_embeddings": 514,
|
| 72 |
-
"model_type": "roberta",
|
| 73 |
-
"num_attention_heads": 12,
|
| 74 |
-
"num_hidden_layers": 12,
|
| 75 |
-
"pad_token_id": 1,
|
| 76 |
-
"position_embedding_type": "absolute",
|
| 77 |
-
"torch_dtype": "float32",
|
| 78 |
-
"transformers_version": "4.55.0",
|
| 79 |
-
"type_vocab_size": 1,
|
| 80 |
-
"use_cache": true,
|
| 81 |
-
"vocab_size": 50265
|
| 82 |
-
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"num_labels": 26,
|
| 3 |
+
"id2label": {
|
| 4 |
+
"0": "1025",
|
| 5 |
+
"1": "1071",
|
| 6 |
+
"2": "131",
|
| 7 |
+
"3": "138",
|
| 8 |
+
"4": "284",
|
| 9 |
+
"5": "285",
|
| 10 |
+
"6": "435",
|
| 11 |
+
"7": "436",
|
| 12 |
+
"8": "595",
|
| 13 |
+
"9": "657",
|
| 14 |
+
"10": "664",
|
| 15 |
+
"11": "682",
|
| 16 |
+
"12": "684",
|
| 17 |
+
"13": "691",
|
| 18 |
+
"14": "693",
|
| 19 |
+
"15": "697",
|
| 20 |
+
"16": "703",
|
| 21 |
+
"17": "706",
|
| 22 |
+
"18": "707",
|
| 23 |
+
"19": "710",
|
| 24 |
+
"20": "74",
|
| 25 |
+
"21": "754",
|
| 26 |
+
"22": "829",
|
| 27 |
+
"23": "862",
|
| 28 |
+
"24": "913",
|
| 29 |
+
"25": "94"
|
| 30 |
+
},
|
| 31 |
+
"label2id": {
|
| 32 |
+
"1025": 0,
|
| 33 |
+
"1071": 1,
|
| 34 |
+
"131": 2,
|
| 35 |
+
"138": 3,
|
| 36 |
+
"284": 4,
|
| 37 |
+
"285": 5,
|
| 38 |
+
"435": 6,
|
| 39 |
+
"436": 7,
|
| 40 |
+
"595": 8,
|
| 41 |
+
"657": 9,
|
| 42 |
+
"664": 10,
|
| 43 |
+
"682": 11,
|
| 44 |
+
"684": 12,
|
| 45 |
+
"691": 13,
|
| 46 |
+
"693": 14,
|
| 47 |
+
"697": 15,
|
| 48 |
+
"703": 16,
|
| 49 |
+
"706": 17,
|
| 50 |
+
"707": 18,
|
| 51 |
+
"710": 19,
|
| 52 |
+
"74": 20,
|
| 53 |
+
"754": 21,
|
| 54 |
+
"829": 22,
|
| 55 |
+
"862": 23,
|
| 56 |
+
"913": 24,
|
| 57 |
+
"94": 25
|
| 58 |
+
}
|
| 59 |
+
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
emissions.csv
CHANGED
|
@@ -1,2 +1,2 @@
|
|
| 1 |
timestamp,project_name,run_id,experiment_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
|
| 2 |
-
2025-08-
|
|
|
|
| 1 |
timestamp,project_name,run_id,experiment_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
|
| 2 |
+
2025-08-27T15:56:42,codecarbon,3997a6b2-dbc8-4248-b049-8e0a8e2524a2,5b0fa12a-3dd7-45bb-9766-cc326314d9f1,42.24432637006976,0.0005517388648629392,1.3060661922493051e-05,42.5,266.00938047930725,94.34468507766725,0.0004984712969778533,0.00363654790924528,0.0011065078722654056,0.005241527078488539,Luxembourg,LUX,luxembourg,,,Linux-6.8.0-71-generic-x86_64-with-glibc2.39,3.12.3,2.8.4,64,AMD EPYC 9124 16-Core Processor,2,2 x NVIDIA L40S,6.1294,49.6113,251.5858268737793,machine,N,1.0
|
metrics.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
-
"eval_loss": 0.
|
| 3 |
"eval_f1_macro": 0.0,
|
| 4 |
"eval_exact_match": 1.0,
|
| 5 |
-
"eval_runtime": 0.
|
| 6 |
-
"eval_samples_per_second":
|
| 7 |
-
"eval_steps_per_second":
|
| 8 |
"epoch": 5.0
|
| 9 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"eval_loss": 0.039671141654253006,
|
| 3 |
"eval_f1_macro": 0.0,
|
| 4 |
"eval_exact_match": 1.0,
|
| 5 |
+
"eval_runtime": 0.263,
|
| 6 |
+
"eval_samples_per_second": 338.428,
|
| 7 |
+
"eval_steps_per_second": 11.408,
|
| 8 |
"epoch": 5.0
|
| 9 |
}
|
pytorch_model.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23f91079994b61055a2f22748cee2ca6f8abcfe57e51cd2a4b0f04c5896aecc9
|
| 3 |
+
size 498747403
|