Robotics
LeRobot
Safetensors
smolvla
sleepyguy25 committed on
Commit
b420bdc
·
verified ·
1 Parent(s): 74e92b3

Upload policy weights, train config and readme

Browse files
Files changed (4) hide show
  1. README.md +63 -0
  2. config.json +2 -2
  3. model.safetensors +1 -1
  4. train_config.json +6 -6
README.md ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: lerobot/smolvla_base
3
+ datasets: sleepyguy25/so1000
4
+ library_name: lerobot
5
+ license: apache-2.0
6
+ model_name: smolvla
7
+ pipeline_tag: robotics
8
+ tags:
9
+ - robotics
10
+ - smolvla
11
+ - lerobot
12
+ ---
13
+
14
+ # Model Card for smolvla
15
+
16
+ <!-- Provide a quick summary of what the model is/does. -->
17
+
18
+
19
+ [SmolVLA](https://huggingface.co/papers/2506.01844) is a compact, efficient vision-language-action model that achieves competitive performance at reduced computational costs and can be deployed on consumer-grade hardware.
20
+
21
+
22
+ This policy has been trained and pushed to the Hub using [LeRobot](https://github.com/huggingface/lerobot).
23
+ See the full documentation at [LeRobot Docs](https://huggingface.co/docs/lerobot/index).
24
+
25
+ ---
26
+
27
+ ## How to Get Started with the Model
28
+
29
+ For a complete walkthrough, see the [training guide](https://huggingface.co/docs/lerobot/il_robots#train-a-policy).
30
+ Below is a short version of how to train the policy and run inference/evaluation:
31
+
32
+ ### Train from scratch
33
+
34
+ ```bash
35
+ lerobot-train \
36
+ --dataset.repo_id=${HF_USER}/<dataset> \
37
+ --policy.type=smolvla \
38
+ --output_dir=outputs/train/<desired_policy_repo_id> \
39
+ --job_name=lerobot_training \
40
+ --policy.device=cuda \
41
+ --policy.repo_id=${HF_USER}/<desired_policy_repo_id> \
42
+ --wandb.enable=true
43
+ ```
44
+
45
+ _Writes checkpoints to `outputs/train/<desired_policy_repo_id>/checkpoints/`._
46
+
47
+ ### Evaluate the policy/run inference
48
+
49
+ ```bash
50
+ lerobot-record \
51
+ --robot.type=so100_follower \
52
+ --dataset.repo_id=<hf_user>/eval_<dataset> \
53
+ --policy.path=<hf_user>/<desired_policy_repo_id> \
54
+ --episodes=10
55
+ ```
56
+
57
+ Prefix the dataset repo with **eval\_** and supply `--policy.path` pointing to a local or hub checkpoint.
58
+
59
+ ---
60
+
61
+ ## Model Details
62
+
63
+ - **License:** apache-2.0
config.json CHANGED
@@ -41,7 +41,7 @@
41
  "device": "cuda",
42
  "use_amp": false,
43
  "push_to_hub": true,
44
- "repo_id": "sleepyguy25smol",
45
  "private": null,
46
  "tags": null,
47
  "license": null,
@@ -69,7 +69,7 @@
69
  ],
70
  "optimizer_eps": 1e-08,
71
  "optimizer_weight_decay": 1e-10,
72
- "optimizer_grad_clip_norm": 10,
73
  "scheduler_warmup_steps": 1000,
74
  "scheduler_decay_steps": 30000,
75
  "scheduler_decay_lr": 2.5e-06,
 
41
  "device": "cuda",
42
  "use_amp": false,
43
  "push_to_hub": true,
44
+ "repo_id": "sleepyguy25/smol",
45
  "private": null,
46
  "tags": null,
47
  "license": null,
 
69
  ],
70
  "optimizer_eps": 1e-08,
71
  "optimizer_weight_decay": 1e-10,
72
+ "optimizer_grad_clip_norm": 10.0,
73
  "scheduler_warmup_steps": 1000,
74
  "scheduler_decay_steps": 30000,
75
  "scheduler_decay_lr": 2.5e-06,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82f0deb01cba2c939da11f5b3bc3d1590bb244917b17468587f584a132a6034b
3
  size 906498200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cedf9be28ea7cb4e0d3df9f5abd8e25b80ebdef717465bd48bc95bbfef52313c
3
  size 906498200
train_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "dataset": {
3
- "repo_id": "sleepyguy25/pick",
4
  "root": "data",
5
  "episodes": null,
6
  "image_transforms": {
@@ -108,7 +108,7 @@
108
  "device": "cuda",
109
  "use_amp": false,
110
  "push_to_hub": true,
111
- "repo_id": "sleepyguy25smol",
112
  "private": null,
113
  "tags": null,
114
  "license": null,
@@ -136,7 +136,7 @@
136
  ],
137
  "optimizer_eps": 1e-08,
138
  "optimizer_weight_decay": 1e-10,
139
- "optimizer_grad_clip_norm": 10,
140
  "scheduler_warmup_steps": 1000,
141
  "scheduler_decay_steps": 30000,
142
  "scheduler_decay_lr": 2.5e-06,
@@ -153,13 +153,13 @@
153
  "min_period": 0.004,
154
  "max_period": 4.0
155
  },
156
- "output_dir": "outputs/train/my_smolvla",
157
  "job_name": "my_smolvla_training",
158
  "resume": false,
159
  "seed": 1000,
160
  "num_workers": 4,
161
  "batch_size": 16,
162
- "steps": 3700,
163
  "eval_freq": 500,
164
  "log_freq": 100,
165
  "save_checkpoint": true,
@@ -169,7 +169,7 @@
169
  "type": "adamw",
170
  "lr": 0.0001,
171
  "weight_decay": 1e-10,
172
- "grad_clip_norm": 10,
173
  "betas": [
174
  0.9,
175
  0.95
 
1
  {
2
  "dataset": {
3
+ "repo_id": "sleepyguy25/so1000",
4
  "root": "data",
5
  "episodes": null,
6
  "image_transforms": {
 
108
  "device": "cuda",
109
  "use_amp": false,
110
  "push_to_hub": true,
111
+ "repo_id": "sleepyguy25/smol",
112
  "private": null,
113
  "tags": null,
114
  "license": null,
 
136
  ],
137
  "optimizer_eps": 1e-08,
138
  "optimizer_weight_decay": 1e-10,
139
+ "optimizer_grad_clip_norm": 10.0,
140
  "scheduler_warmup_steps": 1000,
141
  "scheduler_decay_steps": 30000,
142
  "scheduler_decay_lr": 2.5e-06,
 
153
  "min_period": 0.004,
154
  "max_period": 4.0
155
  },
156
+ "output_dir": "outputs/train/my_smolvla1",
157
  "job_name": "my_smolvla_training",
158
  "resume": false,
159
  "seed": 1000,
160
  "num_workers": 4,
161
  "batch_size": 16,
162
+ "steps": 5000,
163
  "eval_freq": 500,
164
  "log_freq": 100,
165
  "save_checkpoint": true,
 
169
  "type": "adamw",
170
  "lr": 0.0001,
171
  "weight_decay": 1e-10,
172
+ "grad_clip_norm": 10.0,
173
  "betas": [
174
  0.9,
175
  0.95