{"sae": {"activation": "topk", "expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "transcode": false}, "batch_size": 4, "grad_acc_steps": 8, "micro_acc_steps": 1, "optimizer": "signum", "lr": null, "lr_warmup_steps": 1000, "k_decay_steps": 0, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["layers.31", "layers.39", "layers.47"], "init_seeds": [0], "layers": [31, 39, 47], "layer_stride": 1, "distribute_modules": false, "save_every": 1500, "log_to_wandb": true, "run_name": null, "wandb_log_frequency": 1, "model": "unsloth/Qwen2.5-Coder-32B-Instruct", "dataset": "EleutherAI/fineweb-edu-dedup-10b", "split": "train[:10%]", "ctx_len": 2048, "hf_token": null, "revision": null, "load_in_8bit": true, "max_examples": null, "resume": false, "text_column": "text", "finetune": null, "shuffle_seed": 42, "data_preprocessing_num_proc": 72}