Add files using upload-large-folder tool
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +44 -0
- .ipynb_checkpoints/denoising_progression_step_928000-checkpoint.png +3 -0
- .ipynb_checkpoints/evaluation_arc-prize-2025_evaluation_20251011_185417-checkpoint.json +0 -0
- best_model.pt +3 -0
- config.json +52 -0
- denoising_progression_step_016000.png +3 -0
- denoising_progression_step_336000.png +3 -0
- denoising_progression_step_352000.png +3 -0
- denoising_progression_step_368000.png +3 -0
- denoising_progression_step_384000.png +3 -0
- denoising_progression_step_400000.png +3 -0
- denoising_progression_step_416000.png +3 -0
- denoising_progression_step_432000.png +3 -0
- denoising_progression_step_448000.png +3 -0
- denoising_progression_step_464000.png +3 -0
- denoising_progression_step_480000.png +3 -0
- denoising_progression_step_496000.png +3 -0
- denoising_progression_step_512000.png +3 -0
- denoising_progression_step_528000.png +3 -0
- denoising_progression_step_544000.png +3 -0
- denoising_progression_step_560000.png +3 -0
- denoising_progression_step_576000.png +3 -0
- denoising_progression_step_592000.png +3 -0
- denoising_progression_step_608000.png +3 -0
- denoising_progression_step_624000.png +3 -0
- denoising_progression_step_640000.png +3 -0
- denoising_progression_step_656000.png +3 -0
- denoising_progression_step_672000.png +3 -0
- denoising_progression_step_688000.png +3 -0
- denoising_progression_step_704000.png +3 -0
- denoising_progression_step_720000.png +3 -0
- denoising_progression_step_736000.png +3 -0
- denoising_progression_step_752000.png +3 -0
- denoising_progression_step_768000.png +3 -0
- denoising_progression_step_784000.png +3 -0
- denoising_progression_step_800000.png +3 -0
- denoising_progression_step_816000.png +3 -0
- denoising_progression_step_832000.png +3 -0
- denoising_progression_step_848000.png +3 -0
- denoising_progression_step_864000.png +3 -0
- denoising_progression_step_880000.png +3 -0
- denoising_progression_step_896000.png +3 -0
- denoising_progression_step_912000.png +3 -0
- denoising_progression_step_928000.png +3 -0
- denoising_progression_step_944000.png +3 -0
- denoising_progression_step_960000.png +3 -0
- denoising_progression_step_976000.png +3 -0
- denoising_progression_step_992000.png +3 -0
- evaluation_arc-prize-2025_evaluation_20251011_185417.json +0 -0
- final_model.pt +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,47 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
.ipynb_checkpoints/denoising_progression_step_928000-checkpoint.png filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
denoising_progression_step_992000.png filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
denoising_progression_step_016000.png filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
denoising_progression_step_944000.png filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
denoising_progression_step_960000.png filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
denoising_progression_step_912000.png filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
denoising_progression_step_928000.png filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
denoising_progression_step_896000.png filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
denoising_progression_step_976000.png filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
denoising_progression_step_864000.png filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
denoising_progression_step_880000.png filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
denoising_progression_step_800000.png filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
denoising_progression_step_848000.png filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
denoising_progression_step_832000.png filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
denoising_progression_step_816000.png filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
denoising_progression_step_784000.png filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
denoising_progression_step_720000.png filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
denoising_progression_step_736000.png filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
denoising_progression_step_688000.png filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
denoising_progression_step_768000.png filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
denoising_progression_step_704000.png filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
denoising_progression_step_752000.png filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
denoising_progression_step_656000.png filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
denoising_progression_step_672000.png filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
denoising_progression_step_608000.png filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
denoising_progression_step_592000.png filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
denoising_progression_step_624000.png filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
denoising_progression_step_640000.png filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
denoising_progression_step_576000.png filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
denoising_progression_step_544000.png filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
denoising_progression_step_560000.png filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
denoising_progression_step_528000.png filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
denoising_progression_step_480000.png filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
denoising_progression_step_496000.png filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
denoising_progression_step_512000.png filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
denoising_progression_step_464000.png filter=lfs diff=lfs merge=lfs -text
|
| 72 |
+
denoising_progression_step_448000.png filter=lfs diff=lfs merge=lfs -text
|
| 73 |
+
denoising_progression_step_432000.png filter=lfs diff=lfs merge=lfs -text
|
| 74 |
+
denoising_progression_step_368000.png filter=lfs diff=lfs merge=lfs -text
|
| 75 |
+
denoising_progression_step_384000.png filter=lfs diff=lfs merge=lfs -text
|
| 76 |
+
denoising_progression_step_416000.png filter=lfs diff=lfs merge=lfs -text
|
| 77 |
+
denoising_progression_step_400000.png filter=lfs diff=lfs merge=lfs -text
|
| 78 |
+
denoising_progression_step_352000.png filter=lfs diff=lfs merge=lfs -text
|
| 79 |
+
denoising_progression_step_336000.png filter=lfs diff=lfs merge=lfs -text
|
.ipynb_checkpoints/denoising_progression_step_928000-checkpoint.png
ADDED
|
Git LFS Details
|
.ipynb_checkpoints/evaluation_arc-prize-2025_evaluation_20251011_185417-checkpoint.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
best_model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a161bda444f0fbe32996ec1e1cc03021bbd7e8adeff3a55cb4f69d984add81a2
|
| 3 |
+
size 16119157
|
config.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_version": "smol-v7-1M",
|
| 3 |
+
"tag": "aa2",
|
| 4 |
+
"vocab_size": 11,
|
| 5 |
+
"d_model": 384,
|
| 6 |
+
"nhead": 6,
|
| 7 |
+
"num_layers": 4,
|
| 8 |
+
"max_size": 30,
|
| 9 |
+
"embedding_dropout": 0.1,
|
| 10 |
+
"input_grid_dropout": 0.05,
|
| 11 |
+
"num_timesteps": 128,
|
| 12 |
+
"schedule_type": "cosine",
|
| 13 |
+
"batch_size": 128,
|
| 14 |
+
"learning_rate": 0.0004,
|
| 15 |
+
"weight_decay": 0.01,
|
| 16 |
+
"optimizer_steps": 1000000,
|
| 17 |
+
"lr_warmup_steps": 2000,
|
| 18 |
+
"gradient_accumulation_steps": 1,
|
| 19 |
+
"augment": true,
|
| 20 |
+
"log_every": 100,
|
| 21 |
+
"val_every_steps": 1000,
|
| 22 |
+
"vis_every_steps": 16000,
|
| 23 |
+
"eval_every_steps": 25000,
|
| 24 |
+
"num_eval_tasks": 120,
|
| 25 |
+
"best_model_metric": "eval_score",
|
| 26 |
+
"eval_dataset": "evaluation",
|
| 27 |
+
"use_mixed_precision": true,
|
| 28 |
+
"pixel_noise_prob": 0.0,
|
| 29 |
+
"pixel_noise_rate": 0.0,
|
| 30 |
+
"use_ema": true,
|
| 31 |
+
"ema_decay": 0.9995,
|
| 32 |
+
"ema_warmup_steps": 2000,
|
| 33 |
+
"data_dir": "data/arc-prize-2025",
|
| 34 |
+
"datasets": [
|
| 35 |
+
"training_challenges",
|
| 36 |
+
"evaluation_challenges"
|
| 37 |
+
],
|
| 38 |
+
"include_training_test_examples": true,
|
| 39 |
+
"max_val_examples": 128,
|
| 40 |
+
"eval_weight": 10.0,
|
| 41 |
+
"output_dir": "experimental/diffusion/outputs/smol",
|
| 42 |
+
"use_wandb": true,
|
| 43 |
+
"save_best": true,
|
| 44 |
+
"save_final": true,
|
| 45 |
+
"auxiliary_loss": {
|
| 46 |
+
"include_size_head": true,
|
| 47 |
+
"size_head_hidden_dim": 256,
|
| 48 |
+
"auxiliary_size_loss_weight": 0.1,
|
| 49 |
+
"auxiliary_size_loss_warmup": 0
|
| 50 |
+
},
|
| 51 |
+
"profile_mode": false
|
| 52 |
+
}
|
denoising_progression_step_016000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_336000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_352000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_368000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_384000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_400000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_416000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_432000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_448000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_464000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_480000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_496000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_512000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_528000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_544000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_560000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_576000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_592000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_608000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_624000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_640000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_656000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_672000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_688000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_704000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_720000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_736000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_752000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_768000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_784000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_800000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_816000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_832000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_848000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_864000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_880000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_896000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_912000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_928000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_944000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_960000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_976000.png
ADDED
|
Git LFS Details
|
denoising_progression_step_992000.png
ADDED
|
Git LFS Details
|
evaluation_arc-prize-2025_evaluation_20251011_185417.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
final_model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3414550a25421f5245d7bcd0454ca065216b8d3d4754f9dd846fdf0628f04d06
|
| 3 |
+
size 16119364
|