qiuk6 commited on
Commit
87ebec2
·
verified ·
1 Parent(s): 43dfe98

Upload subfolder: exp141-fix-entropy-var-d16-fix-entropy

Browse files
exp141-fix-entropy-var-d16-fix-entropy/ar-ckpt-best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e152bfd31e298c21396dd80c673b34e38ee096cc74bbd43159cf4ea30bc8537
3
+ size 5199119774
exp141-fix-entropy-var-d16-fix-entropy/ar-ckpt-last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e152bfd31e298c21396dd80c673b34e38ee096cc74bbd43159cf4ea30bc8537
3
+ size 5199119774
exp141-fix-entropy-var-d16-fix-entropy/log.txt ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "is_master": true,
3
+ "name": "text",
4
+ "cmd": "--depth=16 --bs=768 --ep=350 --fp16=1 --alng=1e-4 --wpe=0.01 --tblr=8e-5 --data_path /mnt/localssd/ImageNet2012/ --workers 12 --vfast 2 --tfast 2 --encoder_model vit_base_patch14_dinov2.lvd142m --decoder_model vit_base_patch14_dinov2.lvd142m --product_quant 2 --semantic_guide dinov2 --num_latent_tokens 121 --codebook_embed_dim 14 --codebook_size 16384 --v_patch_nums 1 1 2 3 3 4 5 6 8 11 --pn 1_1_2_3_3_4_5_6_8_11 --patch_size 11 --local_out_dir_path /sensei-fs/users/xiangl/exp141-fix-entropy-var-d16-fix-entropy --vae_ckpt /sensei-fs/users/xiangl/output/exp141-fix-entropy/best_ckpt.pt --p_drop 0.0 --st_ep 50 --ed_ep 150 --sem_half True --clip_norm True --scale 1.0 --encoder_depth 6 --proj_coef 0.2 --query False",
5
+ "commit": "a2229298db3e1d35d196f16623f86dea25402aa2",
6
+ "branch": "main",
7
+ "tb_log_dir_path": "/sensei-fs/users/xiangl/exp141-fix-entropy-var-d16-fix-entropy/tb-VARd16__pn1_1_2_3_3_4_5_6_8_11__b768ep350adamlr8e-05wd0.05"
8
+ }
9
+
10
+ {'it': '1669/1669', 'ep': '271/350', 'lr': 6.000451983634238e-05, 'wd': 0.05, 'grad_norm': 0.5359155416488648, 'L_mean': 6.791825395822525, 'L_tail': 6.083762213587761, 'acc_mean': 2.6938556868117303, 'acc_tail': 4.2413482058327645, 'vL_mean': 6.795849323272705, 'vL_tail': 6.034725666046143, 'vacc_mean': 2.7058706283569336, 'vacc_tail': 4.346347332000732, 'remain_time': '13:20:59', 'finish_time': '2024-11-27 05:27'}
11
+ {'it': '1669/1669', 'ep': '271/350', 'lr': 6.000451983634238e-05, 'wd': 0.05, 'grad_norm': 0.5359155416488648, 'L_mean': 6.791825395822525, 'L_tail': 6.083762213587761, 'acc_mean': 2.6938556868117303, 'acc_tail': 4.2413482058327645, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '13:20:19', 'finish_time': '2024-11-27 05:27'}
12
+ {'it': '1669/1669', 'ep': '271/350', 'lr': 6.000451983634238e-05, 'wd': 0.05, 'grad_norm': 0.5359155416488648, 'L_mean': 6.791825395822525, 'L_tail': 6.083762213587761, 'acc_mean': 2.6938556868117303, 'acc_tail': 4.2413482058327645, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '13:20:34', 'finish_time': '2024-11-27 05:27'}
13
+ {'it': '1669/1669', 'ep': '271/350', 'lr': 6.000451983634238e-05, 'wd': 0.05, 'grad_norm': 0.5359155416488648, 'L_mean': 6.791825395822525, 'L_tail': 6.083762213587761, 'acc_mean': 2.6938556868117303, 'acc_tail': 4.2413482058327645, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '13:20:30', 'finish_time': '2024-11-27 05:27'}
14
+ {'it': '1669/1669', 'ep': '272/350', 'lr': 5.9275348699173496e-05, 'wd': 0.05, 'grad_norm': 0.5333468794822693, 'L_mean': 6.7901948422193525, 'L_tail': 6.077424195408821, 'acc_mean': 2.6928540802327916, 'acc_tail': 4.2304795572999865, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '13:11:34', 'finish_time': '2024-11-27 05:28'}
15
+ {'it': '1669/1669', 'ep': '272/350', 'lr': 5.9275348699173496e-05, 'wd': 0.05, 'grad_norm': 0.5333468794822693, 'L_mean': 6.7901948422193525, 'L_tail': 6.077424195408821, 'acc_mean': 2.6928540802327916, 'acc_tail': 4.2304795572999865, 'vL_mean': 6.795849323272705, 'vL_tail': 6.034725666046143, 'vacc_mean': 2.7058706283569336, 'vacc_tail': 4.346347332000732, 'remain_time': '13:11:59', 'finish_time': '2024-11-27 05:29'}
16
+ {'it': '1669/1669', 'ep': '272/350', 'lr': 5.9275348699173496e-05, 'wd': 0.05, 'grad_norm': 0.5333468794822693, 'L_mean': 6.7901948422193525, 'L_tail': 6.077424195408821, 'acc_mean': 2.6928540802327916, 'acc_tail': 4.2304795572999865, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '13:11:49', 'finish_time': '2024-11-27 05:28'}
17
+ {'it': '1669/1669', 'ep': '272/350', 'lr': 5.9275348699173496e-05, 'wd': 0.05, 'grad_norm': 0.5333468794822693, 'L_mean': 6.7901948422193525, 'L_tail': 6.077424195408821, 'acc_mean': 2.6928540802327916, 'acc_tail': 4.2304795572999865, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '13:11:45', 'finish_time': '2024-11-27 05:28'}
18
+ {'it': '1669/1669', 'ep': '273/350', 'lr': 5.8546177562004615e-05, 'wd': 0.05, 'grad_norm': 0.5425156474113464, 'L_mean': 6.786883442103862, 'L_tail': 6.075342810153961, 'acc_mean': 2.7019595564343035, 'acc_tail': 4.235537245403975, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '13:02:43', 'finish_time': '2024-11-27 05:29'}
19
+ {'it': '1669/1669', 'ep': '273/350', 'lr': 5.8546177562004615e-05, 'wd': 0.05, 'grad_norm': 0.5425156474113464, 'L_mean': 6.786883442103862, 'L_tail': 6.075342810153961, 'acc_mean': 2.7019595564343035, 'acc_tail': 4.235537245403975, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '13:03:15', 'finish_time': '2024-11-27 05:30'}
20
+ {'it': '1669/1669', 'ep': '273/350', 'lr': 5.8546177562004615e-05, 'wd': 0.05, 'grad_norm': 0.5425156474113464, 'L_mean': 6.786883442103862, 'L_tail': 6.075342810153961, 'acc_mean': 2.7019595564343035, 'acc_tail': 4.235537245403975, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '13:02:17', 'finish_time': '2024-11-27 05:29'}
21
+ {'it': '1669/1669', 'ep': '273/350', 'lr': 5.8546177562004615e-05, 'wd': 0.05, 'grad_norm': 0.5425156474113464, 'L_mean': 6.786883442103862, 'L_tail': 6.075342810153961, 'acc_mean': 2.7019595564343035, 'acc_tail': 4.235537245403975, 'vL_mean': 6.795849323272705, 'vL_tail': 6.034725666046143, 'vacc_mean': 2.7058706283569336, 'vacc_tail': 4.346347332000732, 'remain_time': '13:02:49', 'finish_time': '2024-11-27 05:29'}
22
+ {'it': '1669/1669', 'ep': '274/350', 'lr': 5.781700642483572e-05, 'wd': 0.05, 'grad_norm': 0.534391438961029, 'L_mean': 6.7892611742019655, 'L_tail': 6.077712887525559, 'acc_mean': 2.6965873374138027, 'acc_tail': 4.252539662411436, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:52:25', 'finish_time': '2024-11-27 05:30'}
23
+ {'it': '1669/1669', 'ep': '274/350', 'lr': 5.781700642483572e-05, 'wd': 0.05, 'grad_norm': 0.534391438961029, 'L_mean': 6.7892611742019655, 'L_tail': 6.077712887525559, 'acc_mean': 2.6965873374138027, 'acc_tail': 4.252539662411436, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:52:20', 'finish_time': '2024-11-27 05:29'}
24
+ {'it': '1669/1669', 'ep': '274/350', 'lr': 5.781700642483572e-05, 'wd': 0.05, 'grad_norm': 0.534391438961029, 'L_mean': 6.7892611742019655, 'L_tail': 6.077712887525559, 'acc_mean': 2.6965873374138027, 'acc_tail': 4.252539662411436, 'vL_mean': 6.795849323272705, 'vL_tail': 6.034725666046143, 'vacc_mean': 2.7058706283569336, 'vacc_tail': 4.346347332000732, 'remain_time': '12:52:08', 'finish_time': '2024-11-27 05:29'}
25
+ {'it': '1669/1669', 'ep': '274/350', 'lr': 5.781700642483572e-05, 'wd': 0.05, 'grad_norm': 0.534391438961029, 'L_mean': 6.7892611742019655, 'L_tail': 6.077712887525559, 'acc_mean': 2.6965873374138027, 'acc_tail': 4.252539662411436, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:52:02', 'finish_time': '2024-11-27 05:29'}
26
+ {'it': '1669/1669', 'ep': '275/350', 'lr': 5.708783528766684e-05, 'wd': 0.05, 'grad_norm': 0.5491738438606262, 'L_mean': 6.785212810337543, 'L_tail': 6.075842995941639, 'acc_mean': 2.709653691854328, 'acc_tail': 4.25383098248858, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:41:15', 'finish_time': '2024-11-27 05:29'}
27
+ {'it': '1669/1669', 'ep': '275/350', 'lr': 5.708783528766684e-05, 'wd': 0.05, 'grad_norm': 0.5491738438606262, 'L_mean': 6.785212810337543, 'L_tail': 6.075842995941639, 'acc_mean': 2.709653691854328, 'acc_tail': 4.25383098248858, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:41:19', 'finish_time': '2024-11-27 05:29'}
28
+ {'it': '1669/1669', 'ep': '275/350', 'lr': 5.708783528766684e-05, 'wd': 0.05, 'grad_norm': 0.5491738438606262, 'L_mean': 6.785212810337543, 'L_tail': 6.075842995941639, 'acc_mean': 2.709653691854328, 'acc_tail': 4.25383098248858, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:41:18', 'finish_time': '2024-11-27 05:29'}
29
+ {'it': '1669/1669', 'ep': '275/350', 'lr': 5.708783528766684e-05, 'wd': 0.05, 'grad_norm': 0.5491738438606262, 'L_mean': 6.785212810337543, 'L_tail': 6.075842995941639, 'acc_mean': 2.709653691854328, 'acc_tail': 4.25383098248858, 'vL_mean': 6.795849323272705, 'vL_tail': 6.034725666046143, 'vacc_mean': 2.7058706283569336, 'vacc_tail': 4.346347332000732, 'remain_time': '12:40:11', 'finish_time': '2024-11-27 05:27'}
30
+ {'it': '1669/1669', 'ep': '276/350', 'lr': 5.635866415049794e-05, 'wd': 0.05, 'grad_norm': 0.544178307056427, 'L_mean': 6.789686697721481, 'L_tail': 6.07426570057869, 'acc_mean': 2.7111105620861053, 'acc_tail': 4.252754895715043, 'vL_mean': 6.795849323272705, 'vL_tail': 6.034725666046143, 'vacc_mean': 2.7058706283569336, 'vacc_tail': 4.346347332000732, 'remain_time': '12:27:50', 'finish_time': '2024-11-27 05:25'}
31
+ {'it': '1669/1669', 'ep': '276/350', 'lr': 5.635866415049794e-05, 'wd': 0.05, 'grad_norm': 0.544178307056427, 'L_mean': 6.789686697721481, 'L_tail': 6.07426570057869, 'acc_mean': 2.7111105620861053, 'acc_tail': 4.252754895715043, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:27:51', 'finish_time': '2024-11-27 05:25'}
32
+ {'it': '1669/1669', 'ep': '276/350', 'lr': 5.635866415049794e-05, 'wd': 0.05, 'grad_norm': 0.544178307056427, 'L_mean': 6.789686697721481, 'L_tail': 6.07426570057869, 'acc_mean': 2.7111105620861053, 'acc_tail': 4.252754895715043, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:27:43', 'finish_time': '2024-11-27 05:25'}
33
+ {'it': '1669/1669', 'ep': '276/350', 'lr': 5.635866415049794e-05, 'wd': 0.05, 'grad_norm': 0.544178307056427, 'L_mean': 6.789686697721481, 'L_tail': 6.07426570057869, 'acc_mean': 2.7111105620861053, 'acc_tail': 4.252754895715043, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:27:48', 'finish_time': '2024-11-27 05:25'}
34
+ {'it': '1669/1669', 'ep': '277/350', 'lr': 5.562949301332906e-05, 'wd': 0.05, 'grad_norm': 0.5563566207885742, 'L_mean': 6.795723493397236, 'L_tail': 6.083289729058743, 'acc_mean': 2.6821096218191087, 'acc_tail': 4.220148990279995, 'vL_mean': 6.795849323272705, 'vL_tail': 6.034725666046143, 'vacc_mean': 2.7058706283569336, 'vacc_tail': 4.346347332000732, 'remain_time': '12:19:28', 'finish_time': '2024-11-27 05:27'}
35
+ {'it': '1669/1669', 'ep': '277/350', 'lr': 5.562949301332906e-05, 'wd': 0.05, 'grad_norm': 0.5563566207885742, 'L_mean': 6.795723493397236, 'L_tail': 6.083289729058743, 'acc_mean': 2.6821096218191087, 'acc_tail': 4.220148990279995, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:19:24', 'finish_time': '2024-11-27 05:27'}
36
+ {'it': '1669/1669', 'ep': '277/350', 'lr': 5.562949301332906e-05, 'wd': 0.05, 'grad_norm': 0.5563566207885742, 'L_mean': 6.795723493397236, 'L_tail': 6.083289729058743, 'acc_mean': 2.6821096218191087, 'acc_tail': 4.220148990279995, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:19:21', 'finish_time': '2024-11-27 05:27'}
37
+ {'it': '1669/1669', 'ep': '277/350', 'lr': 5.562949301332906e-05, 'wd': 0.05, 'grad_norm': 0.5563566207885742, 'L_mean': 6.795723493397236, 'L_tail': 6.083289729058743, 'acc_mean': 2.6821096218191087, 'acc_tail': 4.220148990279995, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:19:40', 'finish_time': '2024-11-27 05:28'}
38
+ {'it': '1669/1669', 'ep': '278/350', 'lr': 5.4900321876160165e-05, 'wd': 0.05, 'grad_norm': 0.5624058365821838, 'L_mean': 6.788099612295627, 'L_tail': 6.073668879270554, 'acc_mean': 2.700821374892257, 'acc_tail': 4.249741793028079, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:12:16', 'finish_time': '2024-11-27 05:30'}
39
+ {'it': '1669/1669', 'ep': '278/350', 'lr': 5.4900321876160165e-05, 'wd': 0.05, 'grad_norm': 0.5624058365821838, 'L_mean': 6.788099612295627, 'L_tail': 6.073668879270554, 'acc_mean': 2.700821374892257, 'acc_tail': 4.249741793028079, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:12:04', 'finish_time': '2024-11-27 05:30'}
40
+ {'it': '1669/1669', 'ep': '278/350', 'lr': 5.4900321876160165e-05, 'wd': 0.05, 'grad_norm': 0.5624058365821838, 'L_mean': 6.788099612295627, 'L_tail': 6.073668879270554, 'acc_mean': 2.700821374892257, 'acc_tail': 4.249741793028079, 'vL_mean': None, 'vL_tail': None, 'vacc_mean': None, 'vacc_tail': None, 'remain_time': '12:11:26', 'finish_time': '2024-11-27 05:29'}
41
+ {'it': '1669/1669', 'ep': '278/350', 'lr': 5.4900321876160165e-05, 'wd': 0.05, 'grad_norm': 0.5624058365821838, 'L_mean': 6.788099612295627, 'L_tail': 6.073668879270554, 'acc_mean': 2.700821374892257, 'acc_tail': 4.249741793028079, 'vL_mean': 6.795849323272705, 'vL_tail': 6.034725666046143, 'vacc_mean': 2.7058706283569336, 'vacc_tail': 4.346347332000732, 'remain_time': '12:11:14', 'finish_time': '2024-11-27 05:29'}
exp141-fix-entropy-var-d16-fix-entropy/stderr.txt ADDED
The diff for this file is too large to render. See raw diff
 
exp141-fix-entropy-var-d16-fix-entropy/stdout.txt ADDED
The diff for this file is too large to render. See raw diff
 
exp141-fix-entropy-var-d16-fix-entropy/tb-VARd16__pn1_1_2_3_3_4_5_6_8_11__b768ep350adamlr8e-05wd0.05/events.out.tfevents.1732495906.msvq-var-train-140-master-0.229334.0__1125_0851 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9220880d839960181f52468dc2703d7d5bfddab1d1bd0a922b897911e21a2d17
3
+ size 511699