Add model and its dependencies

Browse files

Files changed (7) hide show

config.json +26 -0
experiments.log +33 -0
main_config.cfg +27 -0
merges.txt +0 -0
pytorch_model.bin +3 -0
training_args.bin +3 -0
vocab.json +0 -0

config.json ADDED Viewed

	@@ -0,0 +1,26 @@

+{
+  "_name_or_path": "roberta-base",
+  "architectures": [
+    "RobertaForMaskedLM"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "eos_token_id": 2,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "roberta",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "transformers_version": "4.2.2",
+  "type_vocab_size": 4,
+  "use_cache": true,
+  "vocab_size": 50265
+}

experiments.log ADDED Viewed

	@@ -0,0 +1,33 @@

+[56]2021-08-07 10:03:55,527: device: cuda n_gpu: 1
+[56]2021-08-07 10:06:49,449: ***** Running training *****
+[56]2021-08-07 10:06:49,449:   Batch size = 32
+[56]2021-08-07 10:06:49,449:   Num steps = 15015
+[56]2021-08-07 11:24:12,835: [epoch 1] ,lr: 1.5e-05 ,tr_loss: 2485.2335910126567
+[56]2021-08-07 11:24:34,745: ***** Running evaluation *****
+[56]2021-08-07 11:28:35,164:   acc = 0.8122634708956569
+[56]2021-08-07 11:28:35,164:   f1 = 0.3996542284973347
+[56]2021-08-07 11:28:35,164:   precision = 0.46873943899966203
+[56]2021-08-07 11:28:35,164:   recall = 0.3483174284279257
+[56]2021-08-07 12:44:45,042: [epoch 2] ,lr: 3e-05 ,tr_loss: 1232.1717670541257
+[56]2021-08-07 12:45:07,200: ***** Running evaluation *****
+[56]2021-08-07 12:49:07,609:   acc = 0.8737159848621373
+[56]2021-08-07 12:49:07,609:   f1 = 0.6822355741979367
+[56]2021-08-07 12:49:07,609:   precision = 0.6218226906385617
+[56]2021-08-07 12:49:07,609:   recall = 0.7556504269211451
+[56]2021-08-07 14:05:15,094: [epoch 3] ,lr: 0.0 ,tr_loss: 675.0315425428562
+[56]2021-08-07 14:05:37,318: ***** Running evaluation *****
+[56]2021-08-07 14:09:37,825:   acc = 0.9046224544963056
+[56]2021-08-07 14:09:37,825:   f1 = 0.7179965365658719
+[56]2021-08-07 14:09:37,825:   precision = 0.7645390070921986
+[56]2021-08-07 14:09:37,825:   recall = 0.6767955801104972
+[56]2021-08-07 14:09:39,472: -----Best Result-----
+[56]2021-08-07 14:09:39,472:   acc = 0.9046224544963056
+[56]2021-08-07 14:09:39,472:   f1 = 0.7179965365658719
+[56]2021-08-07 14:09:39,472:   precision = 0.7645390070921986
+[56]2021-08-07 14:09:39,472:   recall = 0.6767955801104972
+[56]2021-08-07 14:10:01,830: ***** Running evaluation *****
+[56]2021-08-07 14:14:02,303:   acc = 0.9046224544963056
+[56]2021-08-07 14:14:02,304:   f1 = 0.7179965365658719
+[56]2021-08-07 14:14:02,304:   precision = 0.7645390070921986
+[56]2021-08-07 14:14:02,304:   recall = 0.6767955801104972
+[56]2021-08-07 14:14:02,304: Saved to saves/roberta-base/2_20210807-1003

main_config.cfg ADDED Viewed

	@@ -0,0 +1,27 @@

+[args]
+bert_model=roberta-base
+data_dir=VUA20
+task_name=vua
+model_type=MELBERT
+classifier_hidden=768
+lr_schedule=warmup_linear
+warmup_epoch=2
+drop_ratio=0.2
+kfold=10
+num_bagging=0
+bagging_index=0
+use_pos=True
+use_local_context=True
+max_seq_length=150
+do_train=True
+do_test=True
+do_eval=True
+do_lower_case=False
+class_weight=3
+train_batch_size=32
+eval_batch_size=8
+learning_rate=3e-05
+num_train_epoch=3
+no_cuda=False
+seed=42

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ceef59e211e065a7c50e7dbb7cb2e3f2ea8ffa1ecc19c5e0646406b880963de5
+size 508139373

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c4782e64d86a5a2a6eaad688e9cf07aef3df6805304c80e2315c8f8d1258dd57
+size 1327

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff