jdorairaj committed on
Commit
65da318
·
1 Parent(s): 4840f3d

lllaplace

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. outputs/qqp/args.json +42 -0
  2. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/README.md +0 -0
  3. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/adapter_config.json +0 -0
  4. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/adapter_model.safetensors +0 -0
  5. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results.json +0 -0
  6. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results_la_kron_all_homo_mc_corr_1000.json +0 -0
  7. outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results_la_kron_last_layer_homo_mc_corr_1000.json +1 -0
  8. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res.json +0 -0
  9. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
  10. outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res_la_kron_last_layer_homo_mc_corr_1000.json +0 -0
  11. outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/gpu_stats.json +127 -0
  12. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/special_tokens_map.json +0 -0
  13. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/tokenizer.json +0 -0
  14. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/tokenizer_config.json +0 -0
  15. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/vocab.txt +0 -0
  16. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/README.md +0 -0
  17. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/adapter_config.json +0 -0
  18. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/adapter_model.safetensors +0 -0
  19. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results.json +0 -0
  20. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results_la_kron_all_homo_mc_corr_1000.json +0 -0
  21. outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results_la_kron_last_layer_homo_mc_corr_1000.json +1 -0
  22. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res.json +0 -0
  23. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
  24. outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res_la_kron_last_layer_homo_mc_corr_1000.json +0 -0
  25. outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/gpu_stats.json +127 -0
  26. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/special_tokens_map.json +0 -0
  27. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/tokenizer.json +0 -0
  28. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/tokenizer_config.json +0 -0
  29. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/vocab.txt +0 -0
  30. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/README.md +0 -0
  31. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/adapter_config.json +0 -0
  32. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/adapter_model.safetensors +0 -0
  33. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results.json +0 -0
  34. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results_la_kron_all_homo_mc_corr_1000.json +0 -0
  35. outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results_la_kron_last_layer_homo_mc_corr_1000.json +1 -0
  36. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res.json +0 -0
  37. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
  38. outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res_la_kron_last_layer_homo_mc_corr_1000.json +0 -0
  39. outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/gpu_stats.json +127 -0
  40. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/special_tokens_map.json +0 -0
  41. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/tokenizer.json +0 -0
  42. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/tokenizer_config.json +0 -0
  43. outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/vocab.txt +0 -0
  44. outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/steps.json +5 -0
  45. outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/f_mu_kron_last_layer_homo_1000.pt +3 -0
  46. outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/f_var_kron_last_layer_homo_1000.pt +3 -0
  47. outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/prior_precision_kron_last_layer_homo_1000.pt +3 -0
  48. outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/f_mu_kron_last_layer_homo_1000.pt +3 -0
  49. outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/f_var_kron_last_layer_homo_1000.pt +3 -0
  50. outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/prior_precision_kron_last_layer_homo_1000.pt +3 -0
outputs/qqp/args.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task_name": "qqp",
3
+ "train_file": null,
4
+ "validation_file": null,
5
+ "max_length": 256,
6
+ "pad_to_max_length": false,
7
+ "model_name_or_path": "google-bert/bert-base-uncased",
8
+ "use_slow_tokenizer": false,
9
+ "per_device_train_batch_size": 32,
10
+ "per_device_eval_batch_size": 32,
11
+ "learning_rate": 5e-05,
12
+ "weight_decay": 0.0,
13
+ "num_train_epochs": 5,
14
+ "max_train_steps": null,
15
+ "gradient_accumulation_steps": 1,
16
+ "lr_scheduler_type": "linear",
17
+ "num_warmup_steps": 0,
18
+ "output_dir": "./outputs",
19
+ "peft_method": null,
20
+ "seed": 42,
21
+ "push_to_hub": false,
22
+ "hub_model_id": null,
23
+ "hub_token": null,
24
+ "checkpointing_steps": "1000",
25
+ "resume_from_checkpoint": null,
26
+ "with_tracking": false,
27
+ "report_to": "all",
28
+ "ignore_mismatched_sizes": true,
29
+ "save": false,
30
+ "load_step": 999,
31
+ "lora_r": 8,
32
+ "lora_alpha": 16,
33
+ "lora_dropout": 0.1,
34
+ "laplace_hessian": "kron",
35
+ "laplace_sub": "last_layer",
36
+ "laplace_prior": "homo",
37
+ "laplace_optim_step": 1000,
38
+ "testing_set": "val",
39
+ "laplace_predict": "mc_corr",
40
+ "lm_head": true,
41
+ "cache_dir": "/content/cache/huggingface/metrics/"
42
+ }
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/README.md RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/adapter_config.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/adapter_model.safetensors RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results_la_kron_all_homo_mc_corr_1000.json RENAMED
File without changes
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/all_results_la_kron_last_layer_homo_mc_corr_1000.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"eval_accuracy": 0.3999752658916646, "eval_f1": 0.5510003886801532}
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res_la_kron_all_homo_mc_corr_1000.json RENAMED
File without changes
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/eval_res_la_kron_last_layer_homo_mc_corr_1000.json ADDED
The diff for this file is too large to render. See raw diff
 
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/gpu_stats.json ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "memory_allocated": 2368281600,
3
+ "max_memory_allocated": 2743742464,
4
+ "memory_reserved": 3382706176,
5
+ "max_memory_reserved": 3382706176,
6
+ "memory_stats": {
7
+ "active.all.allocated": 6631649,
8
+ "active.all.current": 3220,
9
+ "active.all.freed": 6628429,
10
+ "active.all.peak": 3230,
11
+ "active.large_pool.allocated": 4004527,
12
+ "active.large_pool.current": 274,
13
+ "active.large_pool.freed": 4004253,
14
+ "active.large_pool.peak": 283,
15
+ "active.small_pool.allocated": 2627122,
16
+ "active.small_pool.current": 2946,
17
+ "active.small_pool.freed": 2624176,
18
+ "active.small_pool.peak": 2955,
19
+ "active_bytes.all.allocated": 35764172915712,
20
+ "active_bytes.all.current": 2368281600,
21
+ "active_bytes.all.freed": 35761804634112,
22
+ "active_bytes.all.peak": 2743742464,
23
+ "active_bytes.large_pool.allocated": 34749907407872,
24
+ "active_bytes.large_pool.current": 2360377344,
25
+ "active_bytes.large_pool.freed": 34747547030528,
26
+ "active_bytes.large_pool.peak": 2737864704,
27
+ "active_bytes.small_pool.allocated": 1014265507840,
28
+ "active_bytes.small_pool.current": 7904256,
29
+ "active_bytes.small_pool.freed": 1014257603584,
30
+ "active_bytes.small_pool.peak": 11914240,
31
+ "allocated_bytes.all.allocated": 35764172915712,
32
+ "allocated_bytes.all.current": 2368281600,
33
+ "allocated_bytes.all.freed": 35761804634112,
34
+ "allocated_bytes.all.peak": 2743742464,
35
+ "allocated_bytes.large_pool.allocated": 34749907407872,
36
+ "allocated_bytes.large_pool.current": 2360377344,
37
+ "allocated_bytes.large_pool.freed": 34747547030528,
38
+ "allocated_bytes.large_pool.peak": 2737864704,
39
+ "allocated_bytes.small_pool.allocated": 1014265507840,
40
+ "allocated_bytes.small_pool.current": 7904256,
41
+ "allocated_bytes.small_pool.freed": 1014257603584,
42
+ "allocated_bytes.small_pool.peak": 11914240,
43
+ "allocation.all.allocated": 6631649,
44
+ "allocation.all.current": 3220,
45
+ "allocation.all.freed": 6628429,
46
+ "allocation.all.peak": 3230,
47
+ "allocation.large_pool.allocated": 4004527,
48
+ "allocation.large_pool.current": 274,
49
+ "allocation.large_pool.freed": 4004253,
50
+ "allocation.large_pool.peak": 283,
51
+ "allocation.small_pool.allocated": 2627122,
52
+ "allocation.small_pool.current": 2946,
53
+ "allocation.small_pool.freed": 2624176,
54
+ "allocation.small_pool.peak": 2955,
55
+ "inactive_split.all.allocated": 4292575,
56
+ "inactive_split.all.current": 116,
57
+ "inactive_split.all.freed": 4292459,
58
+ "inactive_split.all.peak": 131,
59
+ "inactive_split.large_pool.allocated": 2703344,
60
+ "inactive_split.large_pool.current": 109,
61
+ "inactive_split.large_pool.freed": 2703235,
62
+ "inactive_split.large_pool.peak": 118,
63
+ "inactive_split.small_pool.allocated": 1589231,
64
+ "inactive_split.small_pool.current": 7,
65
+ "inactive_split.small_pool.freed": 1589224,
66
+ "inactive_split.small_pool.peak": 17,
67
+ "inactive_split_bytes.all.allocated": 30727348120064,
68
+ "inactive_split_bytes.all.current": 408347648,
69
+ "inactive_split_bytes.all.freed": 30726939772416,
70
+ "inactive_split_bytes.all.peak": 582270464,
71
+ "inactive_split_bytes.large_pool.allocated": 29710313588224,
72
+ "inactive_split_bytes.large_pool.current": 407863296,
73
+ "inactive_split_bytes.large_pool.freed": 29709905724928,
74
+ "inactive_split_bytes.large_pool.peak": 581795840,
75
+ "inactive_split_bytes.small_pool.allocated": 1017034531840,
76
+ "inactive_split_bytes.small_pool.current": 484352,
77
+ "inactive_split_bytes.small_pool.freed": 1017034047488,
78
+ "inactive_split_bytes.small_pool.peak": 5708800,
79
+ "max_split_size": -1,
80
+ "num_alloc_retries": 0,
81
+ "num_ooms": 0,
82
+ "oversize_allocations.allocated": 0,
83
+ "oversize_allocations.current": 0,
84
+ "oversize_allocations.freed": 0,
85
+ "oversize_allocations.peak": 0,
86
+ "oversize_segments.allocated": 0,
87
+ "oversize_segments.current": 0,
88
+ "oversize_segments.freed": 0,
89
+ "oversize_segments.peak": 0,
90
+ "requested_bytes.all.allocated": 34988260561798,
91
+ "requested_bytes.all.current": 2365680124,
92
+ "requested_bytes.all.freed": 34985894881674,
93
+ "requested_bytes.all.peak": 2741468112,
94
+ "requested_bytes.large_pool.allocated": 33974373525760,
95
+ "requested_bytes.large_pool.current": 2358112256,
96
+ "requested_bytes.large_pool.freed": 33972015413504,
97
+ "requested_bytes.large_pool.peak": 2735599616,
98
+ "requested_bytes.small_pool.allocated": 1013887036038,
99
+ "requested_bytes.small_pool.current": 7567868,
100
+ "requested_bytes.small_pool.freed": 1013879468170,
101
+ "requested_bytes.small_pool.peak": 11904040,
102
+ "reserved_bytes.all.allocated": 3873439744,
103
+ "reserved_bytes.all.current": 3382706176,
104
+ "reserved_bytes.all.freed": 490733568,
105
+ "reserved_bytes.all.peak": 3382706176,
106
+ "reserved_bytes.large_pool.allocated": 3856662528,
107
+ "reserved_bytes.large_pool.current": 3374317568,
108
+ "reserved_bytes.large_pool.freed": 482344960,
109
+ "reserved_bytes.large_pool.peak": 3374317568,
110
+ "reserved_bytes.small_pool.allocated": 16777216,
111
+ "reserved_bytes.small_pool.current": 8388608,
112
+ "reserved_bytes.small_pool.freed": 8388608,
113
+ "reserved_bytes.small_pool.peak": 14680064,
114
+ "segment.all.allocated": 145,
115
+ "segment.all.current": 129,
116
+ "segment.all.freed": 16,
117
+ "segment.all.peak": 132,
118
+ "segment.large_pool.allocated": 137,
119
+ "segment.large_pool.current": 125,
120
+ "segment.large_pool.freed": 12,
121
+ "segment.large_pool.peak": 125,
122
+ "segment.small_pool.allocated": 8,
123
+ "segment.small_pool.current": 4,
124
+ "segment.small_pool.freed": 4,
125
+ "segment.small_pool.peak": 7
126
+ }
127
+ }
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/special_tokens_map.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/tokenizer.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/tokenizer_config.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/vocab.txt RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/README.md RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/adapter_config.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/adapter_model.safetensors RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results_la_kron_all_homo_mc_corr_1000.json RENAMED
File without changes
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/all_results_la_kron_last_layer_homo_mc_corr_1000.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"eval_accuracy": 0.8454860252287905, "eval_f1": 0.7988278105175024}
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res_la_kron_all_homo_mc_corr_1000.json RENAMED
File without changes
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/eval_res_la_kron_last_layer_homo_mc_corr_1000.json ADDED
The diff for this file is too large to render. See raw diff
 
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/gpu_stats.json ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "memory_allocated": 2368412672,
3
+ "max_memory_allocated": 2743873536,
4
+ "memory_reserved": 3361734656,
5
+ "max_memory_reserved": 3382706176,
6
+ "memory_stats": {
7
+ "active.all.allocated": 13263297,
8
+ "active.all.current": 3220,
9
+ "active.all.freed": 13260077,
10
+ "active.all.peak": 3230,
11
+ "active.large_pool.allocated": 8009052,
12
+ "active.large_pool.current": 274,
13
+ "active.large_pool.freed": 8008778,
14
+ "active.large_pool.peak": 283,
15
+ "active.small_pool.allocated": 5254245,
16
+ "active.small_pool.current": 2946,
17
+ "active.small_pool.freed": 5251299,
18
+ "active.small_pool.peak": 2955,
19
+ "active_bytes.all.allocated": 71465896812544,
20
+ "active_bytes.all.current": 2368412672,
21
+ "active_bytes.all.freed": 71463528399872,
22
+ "active_bytes.all.peak": 2743873536,
23
+ "active_bytes.large_pool.allocated": 69437365796352,
24
+ "active_bytes.large_pool.current": 2360508416,
25
+ "active_bytes.large_pool.freed": 69435005287936,
26
+ "active_bytes.large_pool.peak": 2737995776,
27
+ "active_bytes.small_pool.allocated": 2028531016192,
28
+ "active_bytes.small_pool.current": 7904256,
29
+ "active_bytes.small_pool.freed": 2028523111936,
30
+ "active_bytes.small_pool.peak": 11914240,
31
+ "allocated_bytes.all.allocated": 71465896812544,
32
+ "allocated_bytes.all.current": 2368412672,
33
+ "allocated_bytes.all.freed": 71463528399872,
34
+ "allocated_bytes.all.peak": 2743873536,
35
+ "allocated_bytes.large_pool.allocated": 69437365796352,
36
+ "allocated_bytes.large_pool.current": 2360508416,
37
+ "allocated_bytes.large_pool.freed": 69435005287936,
38
+ "allocated_bytes.large_pool.peak": 2737995776,
39
+ "allocated_bytes.small_pool.allocated": 2028531016192,
40
+ "allocated_bytes.small_pool.current": 7904256,
41
+ "allocated_bytes.small_pool.freed": 2028523111936,
42
+ "allocated_bytes.small_pool.peak": 11914240,
43
+ "allocation.all.allocated": 13263297,
44
+ "allocation.all.current": 3220,
45
+ "allocation.all.freed": 13260077,
46
+ "allocation.all.peak": 3230,
47
+ "allocation.large_pool.allocated": 8009052,
48
+ "allocation.large_pool.current": 274,
49
+ "allocation.large_pool.freed": 8008778,
50
+ "allocation.large_pool.peak": 283,
51
+ "allocation.small_pool.allocated": 5254245,
52
+ "allocation.small_pool.current": 2946,
53
+ "allocation.small_pool.freed": 5251299,
54
+ "allocation.small_pool.peak": 2955,
55
+ "inactive_split.all.allocated": 9056214,
56
+ "inactive_split.all.current": 117,
57
+ "inactive_split.all.freed": 9056097,
58
+ "inactive_split.all.peak": 758,
59
+ "inactive_split.large_pool.allocated": 5877807,
60
+ "inactive_split.large_pool.current": 108,
61
+ "inactive_split.large_pool.freed": 5877699,
62
+ "inactive_split.large_pool.peak": 118,
63
+ "inactive_split.small_pool.allocated": 3178407,
64
+ "inactive_split.small_pool.current": 9,
65
+ "inactive_split.small_pool.freed": 3178398,
66
+ "inactive_split.small_pool.peak": 649,
67
+ "inactive_split_bytes.all.allocated": 61796334381056,
68
+ "inactive_split_bytes.all.current": 387245056,
69
+ "inactive_split_bytes.all.freed": 61795947136000,
70
+ "inactive_split_bytes.all.peak": 582270464,
71
+ "inactive_split_bytes.large_pool.allocated": 59762423342592,
72
+ "inactive_split_bytes.large_pool.current": 386760704,
73
+ "inactive_split_bytes.large_pool.freed": 59762036581888,
74
+ "inactive_split_bytes.large_pool.peak": 581795840,
75
+ "inactive_split_bytes.small_pool.allocated": 2033911038464,
76
+ "inactive_split_bytes.small_pool.current": 484352,
77
+ "inactive_split_bytes.small_pool.freed": 2033910554112,
78
+ "inactive_split_bytes.small_pool.peak": 6297600,
79
+ "max_split_size": -1,
80
+ "num_alloc_retries": 0,
81
+ "num_ooms": 0,
82
+ "oversize_allocations.allocated": 0,
83
+ "oversize_allocations.current": 0,
84
+ "oversize_allocations.freed": 0,
85
+ "oversize_allocations.peak": 0,
86
+ "oversize_segments.allocated": 0,
87
+ "oversize_segments.current": 0,
88
+ "oversize_segments.freed": 0,
89
+ "oversize_segments.peak": 0,
90
+ "requested_bytes.all.allocated": 69976504084237,
91
+ "requested_bytes.all.current": 2365680124,
92
+ "requested_bytes.all.freed": 69974138404113,
93
+ "requested_bytes.all.peak": 2741468112,
94
+ "requested_bytes.large_pool.allocated": 67948730012160,
95
+ "requested_bytes.large_pool.current": 2358112256,
96
+ "requested_bytes.large_pool.freed": 67946371899904,
97
+ "requested_bytes.large_pool.peak": 2735599616,
98
+ "requested_bytes.small_pool.allocated": 2027774072077,
99
+ "requested_bytes.small_pool.current": 7567868,
100
+ "requested_bytes.small_pool.freed": 2027766504209,
101
+ "requested_bytes.small_pool.peak": 11904040,
102
+ "reserved_bytes.all.allocated": 4970250240,
103
+ "reserved_bytes.all.current": 3361734656,
104
+ "reserved_bytes.all.freed": 1608515584,
105
+ "reserved_bytes.all.peak": 3382706176,
106
+ "reserved_bytes.large_pool.allocated": 4945084416,
107
+ "reserved_bytes.large_pool.current": 3353346048,
108
+ "reserved_bytes.large_pool.freed": 1591738368,
109
+ "reserved_bytes.large_pool.peak": 3374317568,
110
+ "reserved_bytes.small_pool.allocated": 25165824,
111
+ "reserved_bytes.small_pool.current": 8388608,
112
+ "reserved_bytes.small_pool.freed": 16777216,
113
+ "reserved_bytes.small_pool.peak": 14680064,
114
+ "segment.all.allocated": 173,
115
+ "segment.all.current": 128,
116
+ "segment.all.freed": 45,
117
+ "segment.all.peak": 132,
118
+ "segment.large_pool.allocated": 161,
119
+ "segment.large_pool.current": 124,
120
+ "segment.large_pool.freed": 37,
121
+ "segment.large_pool.peak": 125,
122
+ "segment.small_pool.allocated": 12,
123
+ "segment.small_pool.current": 4,
124
+ "segment.small_pool.freed": 8,
125
+ "segment.small_pool.peak": 7
126
+ }
127
+ }
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/special_tokens_map.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/tokenizer.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/tokenizer_config.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/vocab.txt RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/README.md RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/adapter_config.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/adapter_model.safetensors RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results_la_kron_all_homo_mc_corr_1000.json RENAMED
File without changes
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/all_results_la_kron_last_layer_homo_mc_corr_1000.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"eval_accuracy": 0.8571357902547613, "eval_f1": 0.8090073407843396}
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res_la_kron_all_homo_mc_corr_1000.json RENAMED
File without changes
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/eval_res_la_kron_last_layer_homo_mc_corr_1000.json ADDED
The diff for this file is too large to render. See raw diff
 
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/gpu_stats.json ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "memory_allocated": 2368412672,
3
+ "max_memory_allocated": 2743873536,
4
+ "memory_reserved": 3363831808,
5
+ "max_memory_reserved": 3382706176,
6
+ "memory_stats": {
7
+ "active.all.allocated": 19894944,
8
+ "active.all.current": 3220,
9
+ "active.all.freed": 19891724,
10
+ "active.all.peak": 3230,
11
+ "active.large_pool.allocated": 12013577,
12
+ "active.large_pool.current": 274,
13
+ "active.large_pool.freed": 12013303,
14
+ "active.large_pool.peak": 283,
15
+ "active.small_pool.allocated": 7881367,
16
+ "active.small_pool.current": 2946,
17
+ "active.small_pool.freed": 7878421,
18
+ "active.small_pool.peak": 2955,
19
+ "active_bytes.all.allocated": 107167620708864,
20
+ "active_bytes.all.current": 2368412672,
21
+ "active_bytes.all.freed": 107165252296192,
22
+ "active_bytes.all.peak": 2743873536,
23
+ "active_bytes.large_pool.allocated": 104124824184832,
24
+ "active_bytes.large_pool.current": 2360508416,
25
+ "active_bytes.large_pool.freed": 104122463676416,
26
+ "active_bytes.large_pool.peak": 2737995776,
27
+ "active_bytes.small_pool.allocated": 3042796524032,
28
+ "active_bytes.small_pool.current": 7904256,
29
+ "active_bytes.small_pool.freed": 3042788619776,
30
+ "active_bytes.small_pool.peak": 11914240,
31
+ "allocated_bytes.all.allocated": 107167620708864,
32
+ "allocated_bytes.all.current": 2368412672,
33
+ "allocated_bytes.all.freed": 107165252296192,
34
+ "allocated_bytes.all.peak": 2743873536,
35
+ "allocated_bytes.large_pool.allocated": 104124824184832,
36
+ "allocated_bytes.large_pool.current": 2360508416,
37
+ "allocated_bytes.large_pool.freed": 104122463676416,
38
+ "allocated_bytes.large_pool.peak": 2737995776,
39
+ "allocated_bytes.small_pool.allocated": 3042796524032,
40
+ "allocated_bytes.small_pool.current": 7904256,
41
+ "allocated_bytes.small_pool.freed": 3042788619776,
42
+ "allocated_bytes.small_pool.peak": 11914240,
43
+ "allocation.all.allocated": 19894944,
44
+ "allocation.all.current": 3220,
45
+ "allocation.all.freed": 19891724,
46
+ "allocation.all.peak": 3230,
47
+ "allocation.large_pool.allocated": 12013577,
48
+ "allocation.large_pool.current": 274,
49
+ "allocation.large_pool.freed": 12013303,
50
+ "allocation.large_pool.peak": 283,
51
+ "allocation.small_pool.allocated": 7881367,
52
+ "allocation.small_pool.current": 2946,
53
+ "allocation.small_pool.freed": 7878421,
54
+ "allocation.small_pool.peak": 2955,
55
+ "inactive_split.all.allocated": 13817601,
56
+ "inactive_split.all.current": 115,
57
+ "inactive_split.all.freed": 13817486,
58
+ "inactive_split.all.peak": 773,
59
+ "inactive_split.large_pool.allocated": 9052286,
60
+ "inactive_split.large_pool.current": 108,
61
+ "inactive_split.large_pool.freed": 9052178,
62
+ "inactive_split.large_pool.peak": 118,
63
+ "inactive_split.small_pool.allocated": 4765315,
64
+ "inactive_split.small_pool.current": 7,
65
+ "inactive_split.small_pool.freed": 4765308,
66
+ "inactive_split.small_pool.peak": 665,
67
+ "inactive_split_bytes.all.allocated": 92865379165184,
68
+ "inactive_split_bytes.all.current": 387245056,
69
+ "inactive_split_bytes.all.freed": 92864991920128,
70
+ "inactive_split_bytes.all.peak": 582270464,
71
+ "inactive_split_bytes.large_pool.allocated": 89814591620608,
72
+ "inactive_split_bytes.large_pool.current": 386760704,
73
+ "inactive_split_bytes.large_pool.freed": 89814204859904,
74
+ "inactive_split_bytes.large_pool.peak": 581795840,
75
+ "inactive_split_bytes.small_pool.allocated": 3050787544576,
76
+ "inactive_split_bytes.small_pool.current": 484352,
77
+ "inactive_split_bytes.small_pool.freed": 3050787060224,
78
+ "inactive_split_bytes.small_pool.peak": 6297600,
79
+ "max_split_size": -1,
80
+ "num_alloc_retries": 0,
81
+ "num_ooms": 0,
82
+ "oversize_allocations.allocated": 0,
83
+ "oversize_allocations.current": 0,
84
+ "oversize_allocations.freed": 0,
85
+ "oversize_allocations.peak": 0,
86
+ "oversize_segments.allocated": 0,
87
+ "oversize_segments.current": 0,
88
+ "oversize_segments.freed": 0,
89
+ "oversize_segments.peak": 0,
90
+ "requested_bytes.all.allocated": 104964747606675,
91
+ "requested_bytes.all.current": 2365680124,
92
+ "requested_bytes.all.freed": 104962381926551,
93
+ "requested_bytes.all.peak": 2741468112,
94
+ "requested_bytes.large_pool.allocated": 101923086498560,
95
+ "requested_bytes.large_pool.current": 2358112256,
96
+ "requested_bytes.large_pool.freed": 101920728386304,
97
+ "requested_bytes.large_pool.peak": 2735599616,
98
+ "requested_bytes.small_pool.allocated": 3041661108115,
99
+ "requested_bytes.small_pool.current": 7567868,
100
+ "requested_bytes.small_pool.freed": 3041653540247,
101
+ "requested_bytes.small_pool.peak": 11904040,
102
+ "reserved_bytes.all.allocated": 6090129408,
103
+ "reserved_bytes.all.current": 3363831808,
104
+ "reserved_bytes.all.freed": 2726297600,
105
+ "reserved_bytes.all.peak": 3382706176,
106
+ "reserved_bytes.large_pool.allocated": 6054477824,
107
+ "reserved_bytes.large_pool.current": 3353346048,
108
+ "reserved_bytes.large_pool.freed": 2701131776,
109
+ "reserved_bytes.large_pool.peak": 3374317568,
110
+ "reserved_bytes.small_pool.allocated": 35651584,
111
+ "reserved_bytes.small_pool.current": 10485760,
112
+ "reserved_bytes.small_pool.freed": 25165824,
113
+ "reserved_bytes.small_pool.peak": 14680064,
114
+ "segment.all.allocated": 203,
115
+ "segment.all.current": 129,
116
+ "segment.all.freed": 74,
117
+ "segment.all.peak": 132,
118
+ "segment.large_pool.allocated": 186,
119
+ "segment.large_pool.current": 124,
120
+ "segment.large_pool.freed": 62,
121
+ "segment.large_pool.peak": 125,
122
+ "segment.small_pool.allocated": 17,
123
+ "segment.small_pool.current": 5,
124
+ "segment.small_pool.freed": 12,
125
+ "segment.small_pool.peak": 7
126
+ }
127
+ }
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/special_tokens_map.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/tokenizer.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/tokenizer_config.json RENAMED
File without changes
outputs/{google-bert → qqp/google-bert}/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_54577/vocab.txt RENAMED
File without changes
outputs/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/steps.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ [
2
+ 0,
3
+ 27288,
4
+ 54577
5
+ ]
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/f_mu_kron_last_layer_homo_1000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bd24e936219cd2fdf79a74002fd93b9526dfab8212c81ddd2254df563da5a0f
3
+ size 324815
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/f_var_kron_last_layer_homo_1000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dc593ffbad0f4ee51cdc02fbe9ff33aaf44214ef472668b8dc62ef7ebbd0850
3
+ size 648212
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_0/prior_precision_kron_last_layer_homo_1000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61efa51d7df9d4cd224a805e15b8be2673cc94e0c225867cff51f76b8962039a
3
+ size 1414
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/f_mu_kron_last_layer_homo_1000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e9e2a94742c11148a07991cdda0b0f8d34d0c81bef4e336dc1ea171a63311f3
3
+ size 324815
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/f_var_kron_last_layer_homo_1000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71c7b83a790e3a6d1677fa2f4dcbc31a962d94d95b25cbdd25ff9be5bc2f3171
3
+ size 648212
outputs_laplace/qqp/google-bert/bert-base-uncased_lora_lmhead_16_0.1_5e-05_42/step_27288/prior_precision_kron_last_layer_homo_1000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d6617b14a76b60db6b34850c0056e4c870aa2b0a8eeb986b2098ccaef735e27
3
+ size 1414