elselse committed on
Commit
1e64166
·
verified ·
1 Parent(s): c75c61f

End of training

Browse files
Files changed (5) hide show
  1. README.md +6 -6
  2. config.json +58 -81
  3. emissions.csv +1 -1
  4. metrics.json +4 -4
  5. pytorch_model.bin +3 -0
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  This model is a fine-tuned version of [roberta-base](https://huggingface.co/roberta-base) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 0.0532
20
  - F1 Macro: 0.0
21
  - Exact Match: 1.0
22
 
@@ -49,11 +49,11 @@ The following hyperparameters were used during training:
49
 
50
  | Training Loss | Epoch | Step | Validation Loss | F1 Macro | Exact Match |
51
  |:-------------:|:-----:|:----:|:---------------:|:--------:|:-----------:|
52
- | 0.263 | 1.0 | 25 | 0.1400 | 0.0 | 1.0 |
53
- | 0.1315 | 2.0 | 50 | 0.0867 | 0.0 | 1.0 |
54
- | 0.0903 | 3.0 | 75 | 0.0652 | 0.0 | 1.0 |
55
- | 0.0604 | 4.0 | 100 | 0.0560 | 0.0 | 1.0 |
56
- | 0.0556 | 5.0 | 125 | 0.0532 | 0.0 | 1.0 |
57
 
58
 
59
  ### Framework versions
 
16
 
17
  This model is a fine-tuned version of [roberta-base](https://huggingface.co/roberta-base) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
+ - Loss: 0.0397
20
  - F1 Macro: 0.0
21
  - Exact Match: 1.0
22
 
 
49
 
50
  | Training Loss | Epoch | Step | Validation Loss | F1 Macro | Exact Match |
51
  |:-------------:|:-----:|:----:|:---------------:|:--------:|:-----------:|
52
+ | 0.3138 | 1.0 | 25 | 0.0876 | 0.0 | 1.0 |
53
+ | 0.0895 | 2.0 | 50 | 0.0536 | 0.0 | 1.0 |
54
+ | 0.0625 | 3.0 | 75 | 0.0448 | 0.0 | 1.0 |
55
+ | 0.0486 | 4.0 | 100 | 0.0408 | 0.0 | 1.0 |
56
+ | 0.0462 | 5.0 | 125 | 0.0397 | 0.0 | 1.0 |
57
 
58
 
59
  ### Framework versions
config.json CHANGED
@@ -1,82 +1,59 @@
1
  {
2
- "architectures": [
3
- "MultiLabelClassificationModel"
4
- ],
5
- "attention_probs_dropout_prob": 0.1,
6
- "bos_token_id": 0,
7
- "classifier_dropout": null,
8
- "eos_token_id": 2,
9
- "hidden_act": "gelu",
10
- "hidden_dropout_prob": 0.1,
11
- "hidden_size": 768,
12
- "id2label": {
13
- "0": "1025",
14
- "1": "1071",
15
- "2": "131",
16
- "3": "138",
17
- "4": "284",
18
- "5": "285",
19
- "6": "435",
20
- "7": "436",
21
- "8": "595",
22
- "9": "657",
23
- "10": "664",
24
- "11": "682",
25
- "12": "684",
26
- "13": "691",
27
- "14": "693",
28
- "15": "697",
29
- "16": "703",
30
- "17": "706",
31
- "18": "707",
32
- "19": "710",
33
- "20": "74",
34
- "21": "754",
35
- "22": "829",
36
- "23": "862",
37
- "24": "913",
38
- "25": "94"
39
- },
40
- "initializer_range": 0.02,
41
- "intermediate_size": 3072,
42
- "label2id": {
43
- "1025": 0,
44
- "1071": 1,
45
- "131": 2,
46
- "138": 3,
47
- "284": 4,
48
- "285": 5,
49
- "435": 6,
50
- "436": 7,
51
- "595": 8,
52
- "657": 9,
53
- "664": 10,
54
- "682": 11,
55
- "684": 12,
56
- "691": 13,
57
- "693": 14,
58
- "697": 15,
59
- "703": 16,
60
- "706": 17,
61
- "707": 18,
62
- "710": 19,
63
- "74": 20,
64
- "754": 21,
65
- "829": 22,
66
- "862": 23,
67
- "913": 24,
68
- "94": 25
69
- },
70
- "layer_norm_eps": 1e-05,
71
- "max_position_embeddings": 514,
72
- "model_type": "roberta",
73
- "num_attention_heads": 12,
74
- "num_hidden_layers": 12,
75
- "pad_token_id": 1,
76
- "position_embedding_type": "absolute",
77
- "torch_dtype": "float32",
78
- "transformers_version": "4.55.0",
79
- "type_vocab_size": 1,
80
- "use_cache": true,
81
- "vocab_size": 50265
82
- }
 
1
  {
2
+ "num_labels": 26,
3
+ "id2label": {
4
+ "0": "1025",
5
+ "1": "1071",
6
+ "2": "131",
7
+ "3": "138",
8
+ "4": "284",
9
+ "5": "285",
10
+ "6": "435",
11
+ "7": "436",
12
+ "8": "595",
13
+ "9": "657",
14
+ "10": "664",
15
+ "11": "682",
16
+ "12": "684",
17
+ "13": "691",
18
+ "14": "693",
19
+ "15": "697",
20
+ "16": "703",
21
+ "17": "706",
22
+ "18": "707",
23
+ "19": "710",
24
+ "20": "74",
25
+ "21": "754",
26
+ "22": "829",
27
+ "23": "862",
28
+ "24": "913",
29
+ "25": "94"
30
+ },
31
+ "label2id": {
32
+ "1025": 0,
33
+ "1071": 1,
34
+ "131": 2,
35
+ "138": 3,
36
+ "284": 4,
37
+ "285": 5,
38
+ "435": 6,
39
+ "436": 7,
40
+ "595": 8,
41
+ "657": 9,
42
+ "664": 10,
43
+ "682": 11,
44
+ "684": 12,
45
+ "691": 13,
46
+ "693": 14,
47
+ "697": 15,
48
+ "703": 16,
49
+ "706": 17,
50
+ "707": 18,
51
+ "710": 19,
52
+ "74": 20,
53
+ "754": 21,
54
+ "829": 22,
55
+ "862": 23,
56
+ "913": 24,
57
+ "94": 25
58
+ }
59
+ }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
emissions.csv CHANGED
@@ -1,2 +1,2 @@
1
  timestamp,project_name,run_id,experiment_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
2
- 2025-08-27T14:50:19,codecarbon,b680ab9c-d4ee-437c-8326-9f2fe212f3d5,5b0fa12a-3dd7-45bb-9766-cc326314d9f1,48.50631881784648,0.000662966361586643,1.3667628831539448e-05,42.5,170.99735240530177,94.34468507766725,0.0005723921319536102,0.004455213286391313,0.0012705844640130096,0.0062981898823579316,Luxembourg,LUX,luxembourg,,,Linux-6.8.0-71-generic-x86_64-with-glibc2.39,3.12.3,2.8.4,64,AMD EPYC 9124 16-Core Processor,2,2 x NVIDIA L40S,6.1294,49.6113,251.5858268737793,machine,N,1.0
 
1
  timestamp,project_name,run_id,experiment_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
2
+ 2025-08-27T15:56:42,codecarbon,3997a6b2-dbc8-4248-b049-8e0a8e2524a2,5b0fa12a-3dd7-45bb-9766-cc326314d9f1,42.24432637006976,0.0005517388648629392,1.3060661922493051e-05,42.5,266.00938047930725,94.34468507766725,0.0004984712969778533,0.00363654790924528,0.0011065078722654056,0.005241527078488539,Luxembourg,LUX,luxembourg,,,Linux-6.8.0-71-generic-x86_64-with-glibc2.39,3.12.3,2.8.4,64,AMD EPYC 9124 16-Core Processor,2,2 x NVIDIA L40S,6.1294,49.6113,251.5858268737793,machine,N,1.0
metrics.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "eval_loss": 0.05322767049074173,
3
  "eval_f1_macro": 0.0,
4
  "eval_exact_match": 1.0,
5
- "eval_runtime": 0.3388,
6
- "eval_samples_per_second": 262.655,
7
- "eval_steps_per_second": 8.854,
8
  "epoch": 5.0
9
  }
 
1
  {
2
+ "eval_loss": 0.039671141654253006,
3
  "eval_f1_macro": 0.0,
4
  "eval_exact_match": 1.0,
5
+ "eval_runtime": 0.263,
6
+ "eval_samples_per_second": 338.428,
7
+ "eval_steps_per_second": 11.408,
8
  "epoch": 5.0
9
  }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23f91079994b61055a2f22748cee2ca6f8abcfe57e51cd2a4b0f04c5896aecc9
3
+ size 498747403