y1y2y3 committed on
Commit
4ccf026
·
verified ·
1 Parent(s): 7441add

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +52 -61
config.json CHANGED
@@ -1,61 +1,52 @@
1
- {
2
- "type": "smolvla",
3
- "n_obs_steps": 1,
4
- "input_features": {
5
- "observation.state": {
6
- "type": "STATE",
7
- 6
8
- ]
9
- },
10
- "observation.images.camera1": {
11
- "type": "VISUAL",
12
- "shape": [
13
- 3,
14
- 256
15
- ]
16
- },
17
- "observation.images.camera2": {
18
- "type": "VISUAL",
19
- "shape": [
20
- 3,
21
- 256
22
- ]
23
- },
24
- "observation.images.camera3": {
25
- "type": "VISUAL",
26
- "shape": [
27
- 3,
28
- ]
29
- }
30
- },
31
- "device": "cuda",
32
- "use_amp": false,
33
- "push_to_hub": true,
34
- "repo_id": null,
35
- "private": null,
36
- "tags": null,
37
- "license": null,
38
- "chunk_size": 50,
39
- "n_action_steps": 50,
40
- "normalization_mapping": {
41
- "VISUAL": "IDENTITY",
42
- "STATE": "MEAN_STD",
43
- "ACTION": "MEAN_STD"
44
- },
45
- "max_state_dim": 32,
46
- "max_action_dim": 32,
47
- "resize_imgs_with_padding": [
48
- "scheduler_decay_lr": 2.5e-06,
49
- "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
50
- "load_vlm_weights": true,
51
- "add_image_special_tokens": false,
52
- "attention_mode": "cross_attn",
53
- "prefix_length": 0,
54
- "pad_language_to": "max_length",
55
- "num_expert_layers": 0,
56
- "num_vlm_layers": 16,
57
- "self_attn_every_n_layers": 2,
58
- "expert_width_multiplier": 0.75,
59
- "min_period": 0.004,
60
- "max_period": 4.0
61
- }
 
1
+ {
2
+ "type": "smolvla",
3
+ "n_obs_steps": 1,
4
+ "input_features": {
5
+ "observation.state": {
6
+ "type": "STATE",
7
+ "shape": [6]
8
+ },
9
+ "observation.images.camera1": {
10
+ "type": "VISUAL",
11
+ "shape": [3, 256]
12
+ },
13
+ "observation.images.camera2": {
14
+ "type": "VISUAL",
15
+ "shape": [3, 256]
16
+ },
17
+ "observation.images.camera3": {
18
+ "type": "VISUAL",
19
+ "shape": [3]
20
+ }
21
+ },
22
+ "device": "cuda",
23
+ "use_amp": false,
24
+ "push_to_hub": true,
25
+ "repo_id": null,
26
+ "private": null,
27
+ "tags": null,
28
+ "license": null,
29
+ "chunk_size": 50,
30
+ "n_action_steps": 50,
31
+ "normalization_mapping": {
32
+ "VISUAL": "IDENTITY",
33
+ "STATE": "MEAN_STD",
34
+ "ACTION": "MEAN_STD"
35
+ },
36
+ "max_state_dim": 32,
37
+ "max_action_dim": 32,
38
+ "resize_imgs_with_padding": [],
39
+ "scheduler_decay_lr": 2.5e-06,
40
+ "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
41
+ "load_vlm_weights": true,
42
+ "add_image_special_tokens": false,
43
+ "attention_mode": "cross_attn",
44
+ "prefix_length": 0,
45
+ "pad_language_to": "max_length",
46
+ "num_expert_layers": 0,
47
+ "num_vlm_layers": 16,
48
+ "self_attn_every_n_layers": 2,
49
+ "expert_width_multiplier": 0.75,
50
+ "min_period": 0.004,
51
+ "max_period": 4.0
52
+ }