Upload folder using huggingface_hub
Browse files- Models/checkpoint-272/config.json +28 -0
- Models/checkpoint-272/model.safetensors +3 -0
- Models/checkpoint-272/optimizer.pt +3 -0
- Models/checkpoint-272/rng_state.pth +3 -0
- Models/checkpoint-272/scheduler.pt +3 -0
- Models/checkpoint-272/sentencepiece.bpe.model +3 -0
- Models/checkpoint-272/special_tokens_map.json +15 -0
- Models/checkpoint-272/tokenizer.json +3 -0
- Models/checkpoint-272/tokenizer_config.json +55 -0
- Models/checkpoint-272/trainer_state.json +67 -0
- Models/checkpoint-272/training_args.bin +3 -0
- Models/final_model/model.safetensors +1 -1
- guiltbert_train_v2.xlsx +2 -2
- logs/events.out.tfevents.1744199527.0b7e6b5f708f.286.0 +3 -0
- model.safetensors +1 -1
Models/checkpoint-272/config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"XLMRobertaForSequenceClassification"
|
4 |
+
],
|
5 |
+
"attention_probs_dropout_prob": 0.1,
|
6 |
+
"bos_token_id": 0,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"hidden_act": "gelu",
|
10 |
+
"hidden_dropout_prob": 0.1,
|
11 |
+
"hidden_size": 768,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 3072,
|
14 |
+
"layer_norm_eps": 1e-05,
|
15 |
+
"max_position_embeddings": 514,
|
16 |
+
"model_type": "xlm-roberta",
|
17 |
+
"num_attention_heads": 12,
|
18 |
+
"num_hidden_layers": 12,
|
19 |
+
"output_past": true,
|
20 |
+
"pad_token_id": 1,
|
21 |
+
"position_embedding_type": "absolute",
|
22 |
+
"problem_type": "single_label_classification",
|
23 |
+
"torch_dtype": "float32",
|
24 |
+
"transformers_version": "4.50.3",
|
25 |
+
"type_vocab_size": 1,
|
26 |
+
"use_cache": true,
|
27 |
+
"vocab_size": 250002
|
28 |
+
}
|
Models/checkpoint-272/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca3c01e4dca2372e12227f90b59e510a181423744f1f05fc605195a80bab6f10
|
3 |
+
size 1112205008
|
Models/checkpoint-272/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a7e38b811f8ed8f21b7b32682f12cd92b190e9221b70bb3210ce4081c7a3e2e
|
3 |
+
size 2224529658
|
Models/checkpoint-272/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a424bdeaff073831b64d6f171b96733f4d88b27d6a36dadfdd07586eea122c9
|
3 |
+
size 14244
|
Models/checkpoint-272/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fe9fbdc3d94b1235d48f135c4328ab9b7b3437e2ffcce13759551532f697119
|
3 |
+
size 1064
|
Models/checkpoint-272/sentencepiece.bpe.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
|
3 |
+
size 5069051
|
Models/checkpoint-272/special_tokens_map.json
ADDED
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": "<s>",
|
3 |
+
"cls_token": "<s>",
|
4 |
+
"eos_token": "</s>",
|
5 |
+
"mask_token": {
|
6 |
+
"content": "<mask>",
|
7 |
+
"lstrip": true,
|
8 |
+
"normalized": false,
|
9 |
+
"rstrip": false,
|
10 |
+
"single_word": false
|
11 |
+
},
|
12 |
+
"pad_token": "<pad>",
|
13 |
+
"sep_token": "</s>",
|
14 |
+
"unk_token": "<unk>"
|
15 |
+
}
|
Models/checkpoint-272/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93189c5d9a15db043017cfd920e00cf72fe9a4220bd74b460b635f6aa85a61a2
|
3 |
+
size 17082999
|
Models/checkpoint-272/tokenizer_config.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "<s>",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"1": {
|
12 |
+
"content": "<pad>",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"2": {
|
20 |
+
"content": "</s>",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"3": {
|
28 |
+
"content": "<unk>",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"250001": {
|
36 |
+
"content": "<mask>",
|
37 |
+
"lstrip": true,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"bos_token": "<s>",
|
45 |
+
"clean_up_tokenization_spaces": false,
|
46 |
+
"cls_token": "<s>",
|
47 |
+
"eos_token": "</s>",
|
48 |
+
"extra_special_tokens": {},
|
49 |
+
"mask_token": "<mask>",
|
50 |
+
"model_max_length": 512,
|
51 |
+
"pad_token": "<pad>",
|
52 |
+
"sep_token": "</s>",
|
53 |
+
"tokenizer_class": "XLMRobertaTokenizer",
|
54 |
+
"unk_token": "<unk>"
|
55 |
+
}
|
Models/checkpoint-272/trainer_state.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_global_step": 272,
|
3 |
+
"best_metric": 0.23731659352779388,
|
4 |
+
"best_model_checkpoint": "/content/drive/MyDrive/guilt_v2/Models/checkpoint-272",
|
5 |
+
"epoch": 2.0,
|
6 |
+
"eval_steps": 500,
|
7 |
+
"global_step": 272,
|
8 |
+
"is_hyper_param_search": false,
|
9 |
+
"is_local_process_zero": true,
|
10 |
+
"is_world_process_zero": true,
|
11 |
+
"log_history": [
|
12 |
+
{
|
13 |
+
"epoch": 1.0,
|
14 |
+
"eval_accuracy": 0.9356223175965666,
|
15 |
+
"eval_f1": 0.935053775423736,
|
16 |
+
"eval_loss": 0.2828504741191864,
|
17 |
+
"eval_precision": 0.9405556901030809,
|
18 |
+
"eval_recall": 0.9356223175965666,
|
19 |
+
"eval_runtime": 6.4181,
|
20 |
+
"eval_samples_per_second": 72.607,
|
21 |
+
"eval_steps_per_second": 4.674,
|
22 |
+
"step": 136
|
23 |
+
},
|
24 |
+
{
|
25 |
+
"epoch": 2.0,
|
26 |
+
"eval_accuracy": 0.9527896995708155,
|
27 |
+
"eval_f1": 0.9526360064059696,
|
28 |
+
"eval_loss": 0.23731659352779388,
|
29 |
+
"eval_precision": 0.9537728835339494,
|
30 |
+
"eval_recall": 0.9527896995708155,
|
31 |
+
"eval_runtime": 6.2175,
|
32 |
+
"eval_samples_per_second": 74.95,
|
33 |
+
"eval_steps_per_second": 4.825,
|
34 |
+
"step": 272
|
35 |
+
}
|
36 |
+
],
|
37 |
+
"logging_steps": 500,
|
38 |
+
"max_steps": 680,
|
39 |
+
"num_input_tokens_seen": 0,
|
40 |
+
"num_train_epochs": 5,
|
41 |
+
"save_steps": 500,
|
42 |
+
"stateful_callbacks": {
|
43 |
+
"EarlyStoppingCallback": {
|
44 |
+
"args": {
|
45 |
+
"early_stopping_patience": 2,
|
46 |
+
"early_stopping_threshold": 0.0
|
47 |
+
},
|
48 |
+
"attributes": {
|
49 |
+
"early_stopping_patience_counter": 0
|
50 |
+
}
|
51 |
+
},
|
52 |
+
"TrainerControl": {
|
53 |
+
"args": {
|
54 |
+
"should_epoch_stop": false,
|
55 |
+
"should_evaluate": false,
|
56 |
+
"should_log": false,
|
57 |
+
"should_save": true,
|
58 |
+
"should_training_stop": false
|
59 |
+
},
|
60 |
+
"attributes": {}
|
61 |
+
}
|
62 |
+
},
|
63 |
+
"total_flos": 572266545408000.0,
|
64 |
+
"train_batch_size": 16,
|
65 |
+
"trial_name": null,
|
66 |
+
"trial_params": null
|
67 |
+
}
|
Models/checkpoint-272/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:263a36c05af465e44b120f4d3dd83e89419bca7bdc701ed22ccf0495153e60ec
|
3 |
+
size 5368
|
Models/final_model/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1112205008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca3c01e4dca2372e12227f90b59e510a181423744f1f05fc605195a80bab6f10
|
3 |
size 1112205008
|
guiltbert_train_v2.xlsx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f64fc90cab04965d30a185c7edfca7f39e024c0dd994bd85071aab747fdb5ef8
|
3 |
+
size 254287
|
logs/events.out.tfevents.1744199527.0b7e6b5f708f.286.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3b67a59c3a4b32d8f6a6e7682e490e50d69b275a3ee57a6cb367d57866ab4f7
|
3 |
+
size 7568
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1112205008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca3c01e4dca2372e12227f90b59e510a181423744f1f05fc605195a80bab6f10
|
3 |
size 1112205008
|