{
  "data": {
    "shard_root": "/gpfs/home/int/yizhenggong21/work/saev/acts/dinov2_vit_b_reg_-2_rand/db1e1e70eadeff77bb2c52febdc0f443b2fdddb2cf38447b2c0d1576a7e56045",
    "patches": "patches",
    "layer": -2,
    "clamp": 100000.0,
    "n_samples": 524288,
    "shuffled": true,
    "scale_mean": true,
    "scale_norm": true
  },
  "shuffle": false,
  "n_workers": 4,
  "pin_memory": true,
  "prefetch_factor": 4,
  "n_patches": 100000000,
  "sae": {
    "d_vit": 768,
    "exp_factor": 16,
    "n_reinit_samples": 524288,
    "remove_parallel_grads": true,
    "normalize_w_dec": true,
    "seed": 315
  },
  "objective": {
    "sparsity_coeff": 0.0004
  },
  "n_sparsity_warmup": 500,
  "lr": 0.003,
  "n_lr_warmup": 500,
  "lr_scheduler": "warmup",
  "lr_final_factor": 0.0,
  "gradient_clip_value": 0.0,
  "sae_batch_size": 16384,
  "track": true,
  "wandb_project": "saev",
  "tag": "baseline-v4.8-dinov2-vit-b",
  "log_every": 25,
  "ckpt_path": "/gpfs/home/int/yizhenggong21/work/saev/checkpoints",
  "device": "cuda",
  "span_all_devices": true,
  "seed": 48,
  "slurm": false,
  "slurm_acct": "PAS2136",
  "log_to": "/gpfs/home/int/yizhenggong21/work/saev/logs"
}