lllaplace
Browse filesThis view is limited to 50 files because it contains too many changes. Β
See raw diff
- outputs/qqp/args.json +42 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/README.md +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/adapter_config.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/adapter_model.safetensors +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results_la_kron_last_layer_homo_mc_corr_1000.json +1 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res_la_kron_last_layer_homo_mc_corr_1000.json +0 -0
- outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/gpu_stats.json +127 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/special_tokens_map.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/tokenizer.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/tokenizer_config.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/vocab.txt +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/README.md +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/adapter_config.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/adapter_model.safetensors +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results_la_kron_last_layer_homo_mc_corr_1000.json +1 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res_la_kron_last_layer_homo_mc_corr_1000.json +0 -0
- outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/gpu_stats.json +127 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/special_tokens_map.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/tokenizer.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/tokenizer_config.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/vocab.txt +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/README.md +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/adapter_config.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/adapter_model.safetensors +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results_la_kron_last_layer_homo_mc_corr_1000.json +1 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res_la_kron_last_layer_homo_mc_corr_1000.json +0 -0
- outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/gpu_stats.json +127 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/special_tokens_map.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/tokenizer.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/tokenizer_config.json +0 -0
- outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/vocab.txt +0 -0
- outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/steps.json +5 -0
- outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/f_mu_kron_last_layer_homo_1000.pt +3 -0
- outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/f_var_kron_last_layer_homo_1000.pt +3 -0
- outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/prior_precision_kron_last_layer_homo_1000.pt +3 -0
- outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/f_mu_kron_last_layer_homo_1000.pt +3 -0
- outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/f_var_kron_last_layer_homo_1000.pt +3 -0
- outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/prior_precision_kron_last_layer_homo_1000.pt +3 -0
outputs/qqp/args.json
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"task_name": "qqp",
|
3 |
+
"train_file": null,
|
4 |
+
"validation_file": null,
|
5 |
+
"max_length": 256,
|
6 |
+
"pad_to_max_length": false,
|
7 |
+
"model_name_or_path": "google-bert/bert-base-uncased",
|
8 |
+
"use_slow_tokenizer": false,
|
9 |
+
"per_device_train_batch_size": 32,
|
10 |
+
"per_device_eval_batch_size": 32,
|
11 |
+
"learning_rate": 5e-05,
|
12 |
+
"weight_decay": 0.0,
|
13 |
+
"num_train_epochs": 5,
|
14 |
+
"max_train_steps": null,
|
15 |
+
"gradient_accumulation_steps": 1,
|
16 |
+
"lr_scheduler_type": "linear",
|
17 |
+
"num_warmup_steps": 0,
|
18 |
+
"output_dir": "./outputs",
|
19 |
+
"peft_method": null,
|
20 |
+
"seed": 42,
|
21 |
+
"push_to_hub": false,
|
22 |
+
"hub_model_id": null,
|
23 |
+
"hub_token": null,
|
24 |
+
"checkpointing_steps": "1000",
|
25 |
+
"resume_from_checkpoint": null,
|
26 |
+
"with_tracking": false,
|
27 |
+
"report_to": "all",
|
28 |
+
"ignore_mismatched_sizes": true,
|
29 |
+
"save": false,
|
30 |
+
"load_step": 999,
|
31 |
+
"lora_r": 8,
|
32 |
+
"lora_alpha": 16,
|
33 |
+
"lora_dropout": 0.1,
|
34 |
+
"laplace_hessian": "kron",
|
35 |
+
"laplace_sub": "last_layer",
|
36 |
+
"laplace_prior": "homo",
|
37 |
+
"laplace_optim_step": 1000,
|
38 |
+
"testing_set": "val",
|
39 |
+
"laplace_predict": "mc_corr",
|
40 |
+
"lm_head": true,
|
41 |
+
"cache_dir": "/content/cache/huggingface/metrics/"
|
42 |
+
}
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/README.md
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/adapter_config.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/adapter_model.safetensors
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results_la_kron_all_homo_mc_corr_1000.json
RENAMED
File without changes
|
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results_la_kron_last_layer_homo_mc_corr_1000.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eval_accuracy": 0.3999752658916646, "eval_f1": 0.5510003886801532}
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res_la_kron_all_homo_mc_corr_1000.json
RENAMED
File without changes
|
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res_la_kron_last_layer_homo_mc_corr_1000.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/gpu_stats.json
ADDED
@@ -0,0 +1,127 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"memory_allocated": 2368281600,
|
3 |
+
"max_memory_allocated": 2743742464,
|
4 |
+
"memory_reserved": 3382706176,
|
5 |
+
"max_memory_reserved": 3382706176,
|
6 |
+
"memory_stats": {
|
7 |
+
"active.all.allocated": 6631649,
|
8 |
+
"active.all.current": 3220,
|
9 |
+
"active.all.freed": 6628429,
|
10 |
+
"active.all.peak": 3230,
|
11 |
+
"active.large_pool.allocated": 4004527,
|
12 |
+
"active.large_pool.current": 274,
|
13 |
+
"active.large_pool.freed": 4004253,
|
14 |
+
"active.large_pool.peak": 283,
|
15 |
+
"active.small_pool.allocated": 2627122,
|
16 |
+
"active.small_pool.current": 2946,
|
17 |
+
"active.small_pool.freed": 2624176,
|
18 |
+
"active.small_pool.peak": 2955,
|
19 |
+
"active_bytes.all.allocated": 35764172915712,
|
20 |
+
"active_bytes.all.current": 2368281600,
|
21 |
+
"active_bytes.all.freed": 35761804634112,
|
22 |
+
"active_bytes.all.peak": 2743742464,
|
23 |
+
"active_bytes.large_pool.allocated": 34749907407872,
|
24 |
+
"active_bytes.large_pool.current": 2360377344,
|
25 |
+
"active_bytes.large_pool.freed": 34747547030528,
|
26 |
+
"active_bytes.large_pool.peak": 2737864704,
|
27 |
+
"active_bytes.small_pool.allocated": 1014265507840,
|
28 |
+
"active_bytes.small_pool.current": 7904256,
|
29 |
+
"active_bytes.small_pool.freed": 1014257603584,
|
30 |
+
"active_bytes.small_pool.peak": 11914240,
|
31 |
+
"allocated_bytes.all.allocated": 35764172915712,
|
32 |
+
"allocated_bytes.all.current": 2368281600,
|
33 |
+
"allocated_bytes.all.freed": 35761804634112,
|
34 |
+
"allocated_bytes.all.peak": 2743742464,
|
35 |
+
"allocated_bytes.large_pool.allocated": 34749907407872,
|
36 |
+
"allocated_bytes.large_pool.current": 2360377344,
|
37 |
+
"allocated_bytes.large_pool.freed": 34747547030528,
|
38 |
+
"allocated_bytes.large_pool.peak": 2737864704,
|
39 |
+
"allocated_bytes.small_pool.allocated": 1014265507840,
|
40 |
+
"allocated_bytes.small_pool.current": 7904256,
|
41 |
+
"allocated_bytes.small_pool.freed": 1014257603584,
|
42 |
+
"allocated_bytes.small_pool.peak": 11914240,
|
43 |
+
"allocation.all.allocated": 6631649,
|
44 |
+
"allocation.all.current": 3220,
|
45 |
+
"allocation.all.freed": 6628429,
|
46 |
+
"allocation.all.peak": 3230,
|
47 |
+
"allocation.large_pool.allocated": 4004527,
|
48 |
+
"allocation.large_pool.current": 274,
|
49 |
+
"allocation.large_pool.freed": 4004253,
|
50 |
+
"allocation.large_pool.peak": 283,
|
51 |
+
"allocation.small_pool.allocated": 2627122,
|
52 |
+
"allocation.small_pool.current": 2946,
|
53 |
+
"allocation.small_pool.freed": 2624176,
|
54 |
+
"allocation.small_pool.peak": 2955,
|
55 |
+
"inactive_split.all.allocated": 4292575,
|
56 |
+
"inactive_split.all.current": 116,
|
57 |
+
"inactive_split.all.freed": 4292459,
|
58 |
+
"inactive_split.all.peak": 131,
|
59 |
+
"inactive_split.large_pool.allocated": 2703344,
|
60 |
+
"inactive_split.large_pool.current": 109,
|
61 |
+
"inactive_split.large_pool.freed": 2703235,
|
62 |
+
"inactive_split.large_pool.peak": 118,
|
63 |
+
"inactive_split.small_pool.allocated": 1589231,
|
64 |
+
"inactive_split.small_pool.current": 7,
|
65 |
+
"inactive_split.small_pool.freed": 1589224,
|
66 |
+
"inactive_split.small_pool.peak": 17,
|
67 |
+
"inactive_split_bytes.all.allocated": 30727348120064,
|
68 |
+
"inactive_split_bytes.all.current": 408347648,
|
69 |
+
"inactive_split_bytes.all.freed": 30726939772416,
|
70 |
+
"inactive_split_bytes.all.peak": 582270464,
|
71 |
+
"inactive_split_bytes.large_pool.allocated": 29710313588224,
|
72 |
+
"inactive_split_bytes.large_pool.current": 407863296,
|
73 |
+
"inactive_split_bytes.large_pool.freed": 29709905724928,
|
74 |
+
"inactive_split_bytes.large_pool.peak": 581795840,
|
75 |
+
"inactive_split_bytes.small_pool.allocated": 1017034531840,
|
76 |
+
"inactive_split_bytes.small_pool.current": 484352,
|
77 |
+
"inactive_split_bytes.small_pool.freed": 1017034047488,
|
78 |
+
"inactive_split_bytes.small_pool.peak": 5708800,
|
79 |
+
"max_split_size": -1,
|
80 |
+
"num_alloc_retries": 0,
|
81 |
+
"num_ooms": 0,
|
82 |
+
"oversize_allocations.allocated": 0,
|
83 |
+
"oversize_allocations.current": 0,
|
84 |
+
"oversize_allocations.freed": 0,
|
85 |
+
"oversize_allocations.peak": 0,
|
86 |
+
"oversize_segments.allocated": 0,
|
87 |
+
"oversize_segments.current": 0,
|
88 |
+
"oversize_segments.freed": 0,
|
89 |
+
"oversize_segments.peak": 0,
|
90 |
+
"requested_bytes.all.allocated": 34988260561798,
|
91 |
+
"requested_bytes.all.current": 2365680124,
|
92 |
+
"requested_bytes.all.freed": 34985894881674,
|
93 |
+
"requested_bytes.all.peak": 2741468112,
|
94 |
+
"requested_bytes.large_pool.allocated": 33974373525760,
|
95 |
+
"requested_bytes.large_pool.current": 2358112256,
|
96 |
+
"requested_bytes.large_pool.freed": 33972015413504,
|
97 |
+
"requested_bytes.large_pool.peak": 2735599616,
|
98 |
+
"requested_bytes.small_pool.allocated": 1013887036038,
|
99 |
+
"requested_bytes.small_pool.current": 7567868,
|
100 |
+
"requested_bytes.small_pool.freed": 1013879468170,
|
101 |
+
"requested_bytes.small_pool.peak": 11904040,
|
102 |
+
"reserved_bytes.all.allocated": 3873439744,
|
103 |
+
"reserved_bytes.all.current": 3382706176,
|
104 |
+
"reserved_bytes.all.freed": 490733568,
|
105 |
+
"reserved_bytes.all.peak": 3382706176,
|
106 |
+
"reserved_bytes.large_pool.allocated": 3856662528,
|
107 |
+
"reserved_bytes.large_pool.current": 3374317568,
|
108 |
+
"reserved_bytes.large_pool.freed": 482344960,
|
109 |
+
"reserved_bytes.large_pool.peak": 3374317568,
|
110 |
+
"reserved_bytes.small_pool.allocated": 16777216,
|
111 |
+
"reserved_bytes.small_pool.current": 8388608,
|
112 |
+
"reserved_bytes.small_pool.freed": 8388608,
|
113 |
+
"reserved_bytes.small_pool.peak": 14680064,
|
114 |
+
"segment.all.allocated": 145,
|
115 |
+
"segment.all.current": 129,
|
116 |
+
"segment.all.freed": 16,
|
117 |
+
"segment.all.peak": 132,
|
118 |
+
"segment.large_pool.allocated": 137,
|
119 |
+
"segment.large_pool.current": 125,
|
120 |
+
"segment.large_pool.freed": 12,
|
121 |
+
"segment.large_pool.peak": 125,
|
122 |
+
"segment.small_pool.allocated": 8,
|
123 |
+
"segment.small_pool.current": 4,
|
124 |
+
"segment.small_pool.freed": 4,
|
125 |
+
"segment.small_pool.peak": 7
|
126 |
+
}
|
127 |
+
}
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/special_tokens_map.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/tokenizer.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/tokenizer_config.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/vocab.txt
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/README.md
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/adapter_config.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/adapter_model.safetensors
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results_la_kron_all_homo_mc_corr_1000.json
RENAMED
File without changes
|
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results_la_kron_last_layer_homo_mc_corr_1000.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eval_accuracy": 0.8454860252287905, "eval_f1": 0.7988278105175024}
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res_la_kron_all_homo_mc_corr_1000.json
RENAMED
File without changes
|
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res_la_kron_last_layer_homo_mc_corr_1000.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/gpu_stats.json
ADDED
@@ -0,0 +1,127 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"memory_allocated": 2368412672,
|
3 |
+
"max_memory_allocated": 2743873536,
|
4 |
+
"memory_reserved": 3361734656,
|
5 |
+
"max_memory_reserved": 3382706176,
|
6 |
+
"memory_stats": {
|
7 |
+
"active.all.allocated": 13263297,
|
8 |
+
"active.all.current": 3220,
|
9 |
+
"active.all.freed": 13260077,
|
10 |
+
"active.all.peak": 3230,
|
11 |
+
"active.large_pool.allocated": 8009052,
|
12 |
+
"active.large_pool.current": 274,
|
13 |
+
"active.large_pool.freed": 8008778,
|
14 |
+
"active.large_pool.peak": 283,
|
15 |
+
"active.small_pool.allocated": 5254245,
|
16 |
+
"active.small_pool.current": 2946,
|
17 |
+
"active.small_pool.freed": 5251299,
|
18 |
+
"active.small_pool.peak": 2955,
|
19 |
+
"active_bytes.all.allocated": 71465896812544,
|
20 |
+
"active_bytes.all.current": 2368412672,
|
21 |
+
"active_bytes.all.freed": 71463528399872,
|
22 |
+
"active_bytes.all.peak": 2743873536,
|
23 |
+
"active_bytes.large_pool.allocated": 69437365796352,
|
24 |
+
"active_bytes.large_pool.current": 2360508416,
|
25 |
+
"active_bytes.large_pool.freed": 69435005287936,
|
26 |
+
"active_bytes.large_pool.peak": 2737995776,
|
27 |
+
"active_bytes.small_pool.allocated": 2028531016192,
|
28 |
+
"active_bytes.small_pool.current": 7904256,
|
29 |
+
"active_bytes.small_pool.freed": 2028523111936,
|
30 |
+
"active_bytes.small_pool.peak": 11914240,
|
31 |
+
"allocated_bytes.all.allocated": 71465896812544,
|
32 |
+
"allocated_bytes.all.current": 2368412672,
|
33 |
+
"allocated_bytes.all.freed": 71463528399872,
|
34 |
+
"allocated_bytes.all.peak": 2743873536,
|
35 |
+
"allocated_bytes.large_pool.allocated": 69437365796352,
|
36 |
+
"allocated_bytes.large_pool.current": 2360508416,
|
37 |
+
"allocated_bytes.large_pool.freed": 69435005287936,
|
38 |
+
"allocated_bytes.large_pool.peak": 2737995776,
|
39 |
+
"allocated_bytes.small_pool.allocated": 2028531016192,
|
40 |
+
"allocated_bytes.small_pool.current": 7904256,
|
41 |
+
"allocated_bytes.small_pool.freed": 2028523111936,
|
42 |
+
"allocated_bytes.small_pool.peak": 11914240,
|
43 |
+
"allocation.all.allocated": 13263297,
|
44 |
+
"allocation.all.current": 3220,
|
45 |
+
"allocation.all.freed": 13260077,
|
46 |
+
"allocation.all.peak": 3230,
|
47 |
+
"allocation.large_pool.allocated": 8009052,
|
48 |
+
"allocation.large_pool.current": 274,
|
49 |
+
"allocation.large_pool.freed": 8008778,
|
50 |
+
"allocation.large_pool.peak": 283,
|
51 |
+
"allocation.small_pool.allocated": 5254245,
|
52 |
+
"allocation.small_pool.current": 2946,
|
53 |
+
"allocation.small_pool.freed": 5251299,
|
54 |
+
"allocation.small_pool.peak": 2955,
|
55 |
+
"inactive_split.all.allocated": 9056214,
|
56 |
+
"inactive_split.all.current": 117,
|
57 |
+
"inactive_split.all.freed": 9056097,
|
58 |
+
"inactive_split.all.peak": 758,
|
59 |
+
"inactive_split.large_pool.allocated": 5877807,
|
60 |
+
"inactive_split.large_pool.current": 108,
|
61 |
+
"inactive_split.large_pool.freed": 5877699,
|
62 |
+
"inactive_split.large_pool.peak": 118,
|
63 |
+
"inactive_split.small_pool.allocated": 3178407,
|
64 |
+
"inactive_split.small_pool.current": 9,
|
65 |
+
"inactive_split.small_pool.freed": 3178398,
|
66 |
+
"inactive_split.small_pool.peak": 649,
|
67 |
+
"inactive_split_bytes.all.allocated": 61796334381056,
|
68 |
+
"inactive_split_bytes.all.current": 387245056,
|
69 |
+
"inactive_split_bytes.all.freed": 61795947136000,
|
70 |
+
"inactive_split_bytes.all.peak": 582270464,
|
71 |
+
"inactive_split_bytes.large_pool.allocated": 59762423342592,
|
72 |
+
"inactive_split_bytes.large_pool.current": 386760704,
|
73 |
+
"inactive_split_bytes.large_pool.freed": 59762036581888,
|
74 |
+
"inactive_split_bytes.large_pool.peak": 581795840,
|
75 |
+
"inactive_split_bytes.small_pool.allocated": 2033911038464,
|
76 |
+
"inactive_split_bytes.small_pool.current": 484352,
|
77 |
+
"inactive_split_bytes.small_pool.freed": 2033910554112,
|
78 |
+
"inactive_split_bytes.small_pool.peak": 6297600,
|
79 |
+
"max_split_size": -1,
|
80 |
+
"num_alloc_retries": 0,
|
81 |
+
"num_ooms": 0,
|
82 |
+
"oversize_allocations.allocated": 0,
|
83 |
+
"oversize_allocations.current": 0,
|
84 |
+
"oversize_allocations.freed": 0,
|
85 |
+
"oversize_allocations.peak": 0,
|
86 |
+
"oversize_segments.allocated": 0,
|
87 |
+
"oversize_segments.current": 0,
|
88 |
+
"oversize_segments.freed": 0,
|
89 |
+
"oversize_segments.peak": 0,
|
90 |
+
"requested_bytes.all.allocated": 69976504084237,
|
91 |
+
"requested_bytes.all.current": 2365680124,
|
92 |
+
"requested_bytes.all.freed": 69974138404113,
|
93 |
+
"requested_bytes.all.peak": 2741468112,
|
94 |
+
"requested_bytes.large_pool.allocated": 67948730012160,
|
95 |
+
"requested_bytes.large_pool.current": 2358112256,
|
96 |
+
"requested_bytes.large_pool.freed": 67946371899904,
|
97 |
+
"requested_bytes.large_pool.peak": 2735599616,
|
98 |
+
"requested_bytes.small_pool.allocated": 2027774072077,
|
99 |
+
"requested_bytes.small_pool.current": 7567868,
|
100 |
+
"requested_bytes.small_pool.freed": 2027766504209,
|
101 |
+
"requested_bytes.small_pool.peak": 11904040,
|
102 |
+
"reserved_bytes.all.allocated": 4970250240,
|
103 |
+
"reserved_bytes.all.current": 3361734656,
|
104 |
+
"reserved_bytes.all.freed": 1608515584,
|
105 |
+
"reserved_bytes.all.peak": 3382706176,
|
106 |
+
"reserved_bytes.large_pool.allocated": 4945084416,
|
107 |
+
"reserved_bytes.large_pool.current": 3353346048,
|
108 |
+
"reserved_bytes.large_pool.freed": 1591738368,
|
109 |
+
"reserved_bytes.large_pool.peak": 3374317568,
|
110 |
+
"reserved_bytes.small_pool.allocated": 25165824,
|
111 |
+
"reserved_bytes.small_pool.current": 8388608,
|
112 |
+
"reserved_bytes.small_pool.freed": 16777216,
|
113 |
+
"reserved_bytes.small_pool.peak": 14680064,
|
114 |
+
"segment.all.allocated": 173,
|
115 |
+
"segment.all.current": 128,
|
116 |
+
"segment.all.freed": 45,
|
117 |
+
"segment.all.peak": 132,
|
118 |
+
"segment.large_pool.allocated": 161,
|
119 |
+
"segment.large_pool.current": 124,
|
120 |
+
"segment.large_pool.freed": 37,
|
121 |
+
"segment.large_pool.peak": 125,
|
122 |
+
"segment.small_pool.allocated": 12,
|
123 |
+
"segment.small_pool.current": 4,
|
124 |
+
"segment.small_pool.freed": 8,
|
125 |
+
"segment.small_pool.peak": 7
|
126 |
+
}
|
127 |
+
}
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/special_tokens_map.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/tokenizer.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/tokenizer_config.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/vocab.txt
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/README.md
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/adapter_config.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/adapter_model.safetensors
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results_la_kron_all_homo_mc_corr_1000.json
RENAMED
File without changes
|
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results_la_kron_last_layer_homo_mc_corr_1000.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eval_accuracy": 0.8571357902547613, "eval_f1": 0.8090073407843396}
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res_la_kron_all_homo_mc_corr_1000.json
RENAMED
File without changes
|
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res_la_kron_last_layer_homo_mc_corr_1000.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/gpu_stats.json
ADDED
@@ -0,0 +1,127 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"memory_allocated": 2368412672,
|
3 |
+
"max_memory_allocated": 2743873536,
|
4 |
+
"memory_reserved": 3363831808,
|
5 |
+
"max_memory_reserved": 3382706176,
|
6 |
+
"memory_stats": {
|
7 |
+
"active.all.allocated": 19894944,
|
8 |
+
"active.all.current": 3220,
|
9 |
+
"active.all.freed": 19891724,
|
10 |
+
"active.all.peak": 3230,
|
11 |
+
"active.large_pool.allocated": 12013577,
|
12 |
+
"active.large_pool.current": 274,
|
13 |
+
"active.large_pool.freed": 12013303,
|
14 |
+
"active.large_pool.peak": 283,
|
15 |
+
"active.small_pool.allocated": 7881367,
|
16 |
+
"active.small_pool.current": 2946,
|
17 |
+
"active.small_pool.freed": 7878421,
|
18 |
+
"active.small_pool.peak": 2955,
|
19 |
+
"active_bytes.all.allocated": 107167620708864,
|
20 |
+
"active_bytes.all.current": 2368412672,
|
21 |
+
"active_bytes.all.freed": 107165252296192,
|
22 |
+
"active_bytes.all.peak": 2743873536,
|
23 |
+
"active_bytes.large_pool.allocated": 104124824184832,
|
24 |
+
"active_bytes.large_pool.current": 2360508416,
|
25 |
+
"active_bytes.large_pool.freed": 104122463676416,
|
26 |
+
"active_bytes.large_pool.peak": 2737995776,
|
27 |
+
"active_bytes.small_pool.allocated": 3042796524032,
|
28 |
+
"active_bytes.small_pool.current": 7904256,
|
29 |
+
"active_bytes.small_pool.freed": 3042788619776,
|
30 |
+
"active_bytes.small_pool.peak": 11914240,
|
31 |
+
"allocated_bytes.all.allocated": 107167620708864,
|
32 |
+
"allocated_bytes.all.current": 2368412672,
|
33 |
+
"allocated_bytes.all.freed": 107165252296192,
|
34 |
+
"allocated_bytes.all.peak": 2743873536,
|
35 |
+
"allocated_bytes.large_pool.allocated": 104124824184832,
|
36 |
+
"allocated_bytes.large_pool.current": 2360508416,
|
37 |
+
"allocated_bytes.large_pool.freed": 104122463676416,
|
38 |
+
"allocated_bytes.large_pool.peak": 2737995776,
|
39 |
+
"allocated_bytes.small_pool.allocated": 3042796524032,
|
40 |
+
"allocated_bytes.small_pool.current": 7904256,
|
41 |
+
"allocated_bytes.small_pool.freed": 3042788619776,
|
42 |
+
"allocated_bytes.small_pool.peak": 11914240,
|
43 |
+
"allocation.all.allocated": 19894944,
|
44 |
+
"allocation.all.current": 3220,
|
45 |
+
"allocation.all.freed": 19891724,
|
46 |
+
"allocation.all.peak": 3230,
|
47 |
+
"allocation.large_pool.allocated": 12013577,
|
48 |
+
"allocation.large_pool.current": 274,
|
49 |
+
"allocation.large_pool.freed": 12013303,
|
50 |
+
"allocation.large_pool.peak": 283,
|
51 |
+
"allocation.small_pool.allocated": 7881367,
|
52 |
+
"allocation.small_pool.current": 2946,
|
53 |
+
"allocation.small_pool.freed": 7878421,
|
54 |
+
"allocation.small_pool.peak": 2955,
|
55 |
+
"inactive_split.all.allocated": 13817601,
|
56 |
+
"inactive_split.all.current": 115,
|
57 |
+
"inactive_split.all.freed": 13817486,
|
58 |
+
"inactive_split.all.peak": 773,
|
59 |
+
"inactive_split.large_pool.allocated": 9052286,
|
60 |
+
"inactive_split.large_pool.current": 108,
|
61 |
+
"inactive_split.large_pool.freed": 9052178,
|
62 |
+
"inactive_split.large_pool.peak": 118,
|
63 |
+
"inactive_split.small_pool.allocated": 4765315,
|
64 |
+
"inactive_split.small_pool.current": 7,
|
65 |
+
"inactive_split.small_pool.freed": 4765308,
|
66 |
+
"inactive_split.small_pool.peak": 665,
|
67 |
+
"inactive_split_bytes.all.allocated": 92865379165184,
|
68 |
+
"inactive_split_bytes.all.current": 387245056,
|
69 |
+
"inactive_split_bytes.all.freed": 92864991920128,
|
70 |
+
"inactive_split_bytes.all.peak": 582270464,
|
71 |
+
"inactive_split_bytes.large_pool.allocated": 89814591620608,
|
72 |
+
"inactive_split_bytes.large_pool.current": 386760704,
|
73 |
+
"inactive_split_bytes.large_pool.freed": 89814204859904,
|
74 |
+
"inactive_split_bytes.large_pool.peak": 581795840,
|
75 |
+
"inactive_split_bytes.small_pool.allocated": 3050787544576,
|
76 |
+
"inactive_split_bytes.small_pool.current": 484352,
|
77 |
+
"inactive_split_bytes.small_pool.freed": 3050787060224,
|
78 |
+
"inactive_split_bytes.small_pool.peak": 6297600,
|
79 |
+
"max_split_size": -1,
|
80 |
+
"num_alloc_retries": 0,
|
81 |
+
"num_ooms": 0,
|
82 |
+
"oversize_allocations.allocated": 0,
|
83 |
+
"oversize_allocations.current": 0,
|
84 |
+
"oversize_allocations.freed": 0,
|
85 |
+
"oversize_allocations.peak": 0,
|
86 |
+
"oversize_segments.allocated": 0,
|
87 |
+
"oversize_segments.current": 0,
|
88 |
+
"oversize_segments.freed": 0,
|
89 |
+
"oversize_segments.peak": 0,
|
90 |
+
"requested_bytes.all.allocated": 104964747606675,
|
91 |
+
"requested_bytes.all.current": 2365680124,
|
92 |
+
"requested_bytes.all.freed": 104962381926551,
|
93 |
+
"requested_bytes.all.peak": 2741468112,
|
94 |
+
"requested_bytes.large_pool.allocated": 101923086498560,
|
95 |
+
"requested_bytes.large_pool.current": 2358112256,
|
96 |
+
"requested_bytes.large_pool.freed": 101920728386304,
|
97 |
+
"requested_bytes.large_pool.peak": 2735599616,
|
98 |
+
"requested_bytes.small_pool.allocated": 3041661108115,
|
99 |
+
"requested_bytes.small_pool.current": 7567868,
|
100 |
+
"requested_bytes.small_pool.freed": 3041653540247,
|
101 |
+
"requested_bytes.small_pool.peak": 11904040,
|
102 |
+
"reserved_bytes.all.allocated": 6090129408,
|
103 |
+
"reserved_bytes.all.current": 3363831808,
|
104 |
+
"reserved_bytes.all.freed": 2726297600,
|
105 |
+
"reserved_bytes.all.peak": 3382706176,
|
106 |
+
"reserved_bytes.large_pool.allocated": 6054477824,
|
107 |
+
"reserved_bytes.large_pool.current": 3353346048,
|
108 |
+
"reserved_bytes.large_pool.freed": 2701131776,
|
109 |
+
"reserved_bytes.large_pool.peak": 3374317568,
|
110 |
+
"reserved_bytes.small_pool.allocated": 35651584,
|
111 |
+
"reserved_bytes.small_pool.current": 10485760,
|
112 |
+
"reserved_bytes.small_pool.freed": 25165824,
|
113 |
+
"reserved_bytes.small_pool.peak": 14680064,
|
114 |
+
"segment.all.allocated": 203,
|
115 |
+
"segment.all.current": 129,
|
116 |
+
"segment.all.freed": 74,
|
117 |
+
"segment.all.peak": 132,
|
118 |
+
"segment.large_pool.allocated": 186,
|
119 |
+
"segment.large_pool.current": 124,
|
120 |
+
"segment.large_pool.freed": 62,
|
121 |
+
"segment.large_pool.peak": 125,
|
122 |
+
"segment.small_pool.allocated": 17,
|
123 |
+
"segment.small_pool.current": 5,
|
124 |
+
"segment.small_pool.freed": 12,
|
125 |
+
"segment.small_pool.peak": 7
|
126 |
+
}
|
127 |
+
}
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/special_tokens_map.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/tokenizer.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/tokenizer_config.json
RENAMED
File without changes
|
outputs/{google-bert β qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/vocab.txt
RENAMED
File without changes
|
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/steps.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
0,
|
3 |
+
27288,
|
4 |
+
54577
|
5 |
+
]
|
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/f_mu_kron_last_layer_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bd24e936219cd2fdf79a74002fd93b9526dfab8212c81ddd2254df563da5a0f
|
3 |
+
size 324815
|
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/f_var_kron_last_layer_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dc593ffbad0f4ee51cdc02fbe9ff33aaf44214ef472668b8dc62ef7ebbd0850
|
3 |
+
size 648212
|
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/prior_precision_kron_last_layer_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61efa51d7df9d4cd224a805e15b8be2673cc94e0c225867cff51f76b8962039a
|
3 |
+
size 1414
|
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/f_mu_kron_last_layer_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e9e2a94742c11148a07991cdda0b0f8d34d0c81bef4e336dc1ea171a63311f3
|
3 |
+
size 324815
|
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/f_var_kron_last_layer_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71c7b83a790e3a6d1677fa2f4dcbc31a962d94d95b25cbdd25ff9be5bc2f3171
|
3 |
+
size 648212
|
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/prior_precision_kron_last_layer_homo_1000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d6617b14a76b60db6b34850c0056e4c870aa2b0a8eeb986b2098ccaef735e27
|
3 |
+
size 1414
|