LA on cola
Browse files- outputs/args.json +47 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_0/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_0/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_1068/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_1068/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_2137/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_2137/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_3206/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_3206/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_4275/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_4275/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_5344/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_5344/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_0/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_0/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_0/prior_precision_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_1068/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_1068/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_1068/prior_precision_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_2137/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_2137/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_2137/prior_precision_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_3206/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_3206/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_3206/prior_precision_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_4275/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_4275/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_4275/prior_precision_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_5344/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_5344/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_5344/prior_precision_kron_all_homo_1000.pt +3 -0
outputs/args.json
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"task_name": "cola",
|
3 |
+
"train_file": null,
|
4 |
+
"validation_file": null,
|
5 |
+
"max_length": 256,
|
6 |
+
"pad_to_max_length": false,
|
7 |
+
"model_name_or_path": "google-bert/bert-base-uncased",
|
8 |
+
"use_slow_tokenizer": true,
|
9 |
+
"per_device_train_batch_size": 8,
|
10 |
+
"per_device_eval_batch_size": 8,
|
11 |
+
"learning_rate": 5e-05,
|
12 |
+
"weight_decay": 0.0,
|
13 |
+
"num_train_epochs": 5,
|
14 |
+
"max_train_steps": null,
|
15 |
+
"gradient_accumulation_steps": 1,
|
16 |
+
"lr_scheduler_type": "linear",
|
17 |
+
"num_warmup_steps": 0,
|
18 |
+
"output_dir": "./outputs",
|
19 |
+
"peft_method": null,
|
20 |
+
"seed": 42,
|
21 |
+
"push_to_hub": false,
|
22 |
+
"hub_model_id": null,
|
23 |
+
"hub_token": null,
|
24 |
+
"checkpointing_steps": "1000",
|
25 |
+
"resume_from_checkpoint": null,
|
26 |
+
"with_tracking": false,
|
27 |
+
"report_to": "all",
|
28 |
+
"ignore_mismatched_sizes": true,
|
29 |
+
"save": false,
|
30 |
+
"load_step": 999,
|
31 |
+
"laplace_hessian": "kron",
|
32 |
+
"laplace_sub": "all",
|
33 |
+
"laplace_prior": "homo",
|
34 |
+
"laplace_optim_step": 1000,
|
35 |
+
"testing_set": "val",
|
36 |
+
"laplace_predict": "mc_corr",
|
37 |
+
"lm_head": false,
|
38 |
+
"cache_dir": "/content/cache/huggingface/metrics/glue",
|
39 |
+
"step_list": [
|
40 |
+
0,
|
41 |
+
1068,
|
42 |
+
2137,
|
43 |
+
3206,
|
44 |
+
4275,
|
45 |
+
5344
|
46 |
+
]
|
47 |
+
}
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_0/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eval_matthews_correlation": 0.01486714832435204}
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_0/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_1068/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eval_matthews_correlation": 0.46484295300587036}
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_1068/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_2137/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eval_matthews_correlation": 0.5072753983504138}
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_2137/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_3206/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eval_matthews_correlation": 0.5152882228132933}
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_3206/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_4275/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eval_matthews_correlation": 0.5127766293248668}
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_4275/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_5344/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eval_matthews_correlation": 0.5073548497499728}
|
outputs/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_5344/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_0/f_mu_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:203a7b4f06680c1f148d35614d77e524a04429f7a7a7bfd560604d9a680d3e1f
|
3 |
+
size 9644
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_0/f_var_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6497e3165d2474a55fc3680100e49d8aeea9122dc45141113513d87135284373
|
3 |
+
size 18033
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_0/prior_precision_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70293dc63149b212d9909341057cba43e85c91db4a062169c3ec1afcc4b480fd
|
3 |
+
size 1379
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_1068/f_mu_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9342bc5e6bc3048582040e3c3b97cca265c5fc46aa7855afe08bb4700471e26
|
3 |
+
size 9644
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_1068/f_var_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aea76c439e56afd5a2802061a69f99f0f83ae30bd532666ea2031c34a06a980b
|
3 |
+
size 18033
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_1068/prior_precision_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17621686933193907d927cdd895971ebe56424f216872585daf2b308ba9ce175
|
3 |
+
size 1379
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_2137/f_mu_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21b9e12e2d267c48633ffeb9f1b06c483a1c9aef1a531f825f57d3efac350cfa
|
3 |
+
size 9644
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_2137/f_var_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:509fb9f2005cd2f26b0288ed7b4514fbb0108e321a43ed78757c251689bf3e78
|
3 |
+
size 18033
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_2137/prior_precision_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:484b2af776ef15b6481462d67ec7a52a60ee79ea5bc081b10697a9f6c225b04e
|
3 |
+
size 1379
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_3206/f_mu_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:992d32a39dc00901320b10809088d7868bc6e81125f9ec0a56ea8799f72e5062
|
3 |
+
size 9644
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_3206/f_var_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1257b3cbf8e863ea649b2bfba2d59de9765048247847a7b1b00aaf4de056d51e
|
3 |
+
size 18033
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_3206/prior_precision_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32f262b79c63ef923eba180cfaf0a766fb8292cd8ff14cc48d373b0f701d803e
|
3 |
+
size 1379
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_4275/f_mu_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:125ce209445309ba61b6a002256320df0dfc28b1f3653a06af3dd6509144bb15
|
3 |
+
size 9644
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_4275/f_var_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:622b4492b70532b3768091a23b2d2ce9b2ea11915873f8ad795d7b2ab66c493d
|
3 |
+
size 18033
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_4275/prior_precision_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d9c4f11d19f9abb61aecaa6116a09f9548034d7642ddcd2438939346e01c291
|
3 |
+
size 1379
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_5344/f_mu_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17b302ed47298212d9d3fb720acf0ce3a1cd08f4c8996849c03cc56b85a093b7
|
3 |
+
size 9644
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_5344/f_var_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d98a9ba303de7fd5afd3214208b6cad22ca8ee65c13a684671e942efdec8e4ee
|
3 |
+
size 18033
|
outputs_laplace/cola/google-bert/bert-base-uncased_adapters_5e-05_42/step_5344/prior_precision_kron_all_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8d2f2eb2c1d5f0bbb6b0b4ed062f4209c84e1bb0424c331726eb25163d69ee5
|
3 |
+
size 1379
|