ZhangYunchenY
committed on
Commit
·
2b5129f
1
Parent(s):
4f776f3
[Model] bert-base-uncased-mrpc
Browse files
- config.json +21 -0
- flax_model.msgpack +3 -0
- pytorch_model.bin +3 -0
- special_tokens_map.json +1 -0
- tokenizer_config.json +1 -0
- train_args.json +25 -0
- training_args.bin +3 -0
- vocab.txt +0 -0
config.json
ADDED
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"BertForSequenceClassification"
|
4 |
+
],
|
5 |
+
"attention_probs_dropout_prob": 0.1,
|
6 |
+
"finetuning_task": "glue:mrpc",
|
7 |
+
"gradient_checkpointing": false,
|
8 |
+
"hidden_act": "gelu",
|
9 |
+
"hidden_dropout_prob": 0.1,
|
10 |
+
"hidden_size": 768,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 3072,
|
13 |
+
"layer_norm_eps": 1e-12,
|
14 |
+
"max_position_embeddings": 512,
|
15 |
+
"model_type": "bert",
|
16 |
+
"num_attention_heads": 12,
|
17 |
+
"num_hidden_layers": 12,
|
18 |
+
"pad_token_id": 0,
|
19 |
+
"type_vocab_size": 2,
|
20 |
+
"vocab_size": 30522
|
21 |
+
}
|
flax_model.msgpack
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6bad8dd3140b4311d21788a48af3d0fb8e89836dda48feac82417b013855744
|
3 |
+
size 437942328
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21a7986a9000bb97d11204644f03ffe41975bc2686fd487052159709fa21c2ad
|
3 |
+
size 437985387
|
special_tokens_map.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
|
tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"do_lower_case": true, "model_max_length": 512}
|
train_args.json
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model": "bert-base-uncased",
|
3 |
+
"dataset": "glue:mrpc",
|
4 |
+
"dataset_train_split": "train",
|
5 |
+
"dataset_dev_split": "validation",
|
6 |
+
"tb_writer_step": 1000,
|
7 |
+
"checkpoint_steps": -1,
|
8 |
+
"checkpoint_every_epoch": false,
|
9 |
+
"num_train_epochs": 5,
|
10 |
+
"early_stopping_epochs": -1,
|
11 |
+
"batch_size": 16,
|
12 |
+
"max_length": 256,
|
13 |
+
"learning_rate": 2e-05,
|
14 |
+
"grad_accum_steps": 1,
|
15 |
+
"warmup_proportion": 0.1,
|
16 |
+
"config_name": "config.json",
|
17 |
+
"weights_name": "pytorch_model.bin",
|
18 |
+
"enable_wandb": false,
|
19 |
+
"output_dir": "/p/qdata/jm8wx/research/text_attacks/textattack/outputs/training/bert-base-uncased-glue:mrpc-2020-06-29-12:04/",
|
20 |
+
"num_labels": 2,
|
21 |
+
"do_regression": false,
|
22 |
+
"best_eval_score": 0.8774509803921569,
|
23 |
+
"best_eval_score_epoch": 1,
|
24 |
+
"epochs_since_best_eval_score": 3
|
25 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa5000b32c859685e72c5f58fce286e71e954e939368cca75c7742ef5e3cc795
|
3 |
+
size 1052
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|