Robotics
LeRobot
Safetensors
smolvla
incyvinvy committed on
Commit
878598d
·
verified ·
1 Parent(s): 1ceb7ba

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +67 -84
config.json CHANGED
@@ -1,88 +1,71 @@
1
  {
2
- "type": "smolvla",
3
- "n_obs_steps": 1,
4
- "normalization_mapping": {
5
- "VISUAL": "IDENTITY",
6
- "STATE": "MEAN_STD",
7
- "ACTION": "MEAN_STD"
 
 
 
 
 
 
8
  },
9
- "input_features": {
10
- "observation.state": {
11
- "type": "STATE",
12
- "shape": [
13
- 6
14
- ]
15
- },
16
- "observation.images.top": {
17
- "type": "VISUAL",
18
- "shape": [
19
- 3,
20
- 480,
21
- 640
22
- ]
23
- },
24
- "observation.images.wrist": {
25
- "type": "VISUAL",
26
- "shape": [
27
- 3,
28
- 480,
29
- 640
30
- ]
31
- }
32
  },
33
- "output_features": {
34
- "action": {
35
- "type": "ACTION",
36
- "shape": [
37
- 6
38
- ]
39
- }
40
- },
41
- "device": "cuda",
42
- "use_amp": false,
43
- "push_to_hub": true,
44
- "repo_id": "incyvinvy/smolvla_colabtrained_wandb",
45
- "private": null,
46
- "tags": null,
47
- "license": null,
48
- "chunk_size": 50,
49
- "n_action_steps": 50,
50
- "max_state_dim": 32,
51
- "max_action_dim": 32,
52
- "resize_imgs_with_padding": [
53
- 512,
54
- 512
55
- ],
56
- "empty_cameras": 0,
57
- "adapt_to_pi_aloha": false,
58
- "use_delta_joint_actions_aloha": false,
59
- "tokenizer_max_length": 48,
60
- "num_steps": 10,
61
- "use_cache": true,
62
- "freeze_vision_encoder": true,
63
- "train_expert_only": true,
64
- "train_state_proj": true,
65
- "optimizer_lr": 0.0001,
66
- "optimizer_betas": [
67
- 0.9,
68
- 0.95
69
- ],
70
- "optimizer_eps": 1e-08,
71
- "optimizer_weight_decay": 1e-10,
72
- "optimizer_grad_clip_norm": 10.0,
73
- "scheduler_warmup_steps": 1000,
74
- "scheduler_decay_steps": 30000,
75
- "scheduler_decay_lr": 2.5e-06,
76
- "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
77
- "load_vlm_weights": true,
78
- "add_image_special_tokens": false,
79
- "attention_mode": "cross_attn",
80
- "prefix_length": 0,
81
- "pad_language_to": "max_length",
82
- "num_expert_layers": 0,
83
- "num_vlm_layers": 16,
84
- "self_attn_every_n_layers": 2,
85
- "expert_width_multiplier": 0.75,
86
- "min_period": 0.004,
87
- "max_period": 4.0
88
  }
 
1
  {
2
+ "model_type": "smolvla",
3
+ "type": "smolvla",
4
+ "n_obs_steps": 1,
5
+ "normalization_mapping": {
6
+ "VISUAL": "IDENTITY",
7
+ "STATE": "MEAN_STD",
8
+ "ACTION": "MEAN_STD"
9
+ },
10
+ "input_features": {
11
+ "observation.state": {
12
+ "type": "STATE",
13
+ "shape": [6]
14
  },
15
+ "observation.images.top": {
16
+ "type": "VISUAL",
17
+ "shape": [3, 480, 640]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
18
  },
19
+ "observation.images.wrist": {
20
+ "type": "VISUAL",
21
+ "shape": [3, 480, 640]
22
+ }
23
+ },
24
+ "output_features": {
25
+ "action": {
26
+ "type": "ACTION",
27
+ "shape": [6]
28
+ }
29
+ },
30
+ "device": "cuda",
31
+ "use_amp": false,
32
+ "push_to_hub": true,
33
+ "repo_id": "incyvinvy/smolvla_colabtrained_wandb",
34
+ "private": null,
35
+ "tags": null,
36
+ "license": null,
37
+ "chunk_size": 50,
38
+ "n_action_steps": 50,
39
+ "max_state_dim": 32,
40
+ "max_action_dim": 32,
41
+ "resize_imgs_with_padding": [512, 512],
42
+ "empty_cameras": 0,
43
+ "adapt_to_pi_aloha": false,
44
+ "use_delta_joint_actions_aloha": false,
45
+ "tokenizer_max_length": 48,
46
+ "num_steps": 10,
47
+ "use_cache": true,
48
+ "freeze_vision_encoder": true,
49
+ "train_expert_only": true,
50
+ "train_state_proj": true,
51
+ "optimizer_lr": 0.0001,
52
+ "optimizer_betas": [0.9, 0.95],
53
+ "optimizer_eps": 1e-08,
54
+ "optimizer_weight_decay": 1e-10,
55
+ "optimizer_grad_clip_norm": 10.0,
56
+ "scheduler_warmup_steps": 1000,
57
+ "scheduler_decay_steps": 30000,
58
+ "scheduler_decay_lr": 2.5e-06,
59
+ "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
60
+ "load_vlm_weights": true,
61
+ "add_image_special_tokens": false,
62
+ "attention_mode": "cross_attn",
63
+ "prefix_length": 0,
64
+ "pad_language_to": "max_length",
65
+ "num_expert_layers": 0,
66
+ "num_vlm_layers": 16,
67
+ "self_attn_every_n_layers": 2,
68
+ "expert_width_multiplier": 0.75,
69
+ "min_period": 0.004,
70
+ "max_period": 4.0
 
 
 
71
  }