m1b committed on
Commit
58e0f6f
1 Parent(s): d04888c

Upload folder using huggingface_hub

Browse files
Files changed (4) hide show
  1. README.md +9 -0
  2. config.json +46 -0
  3. config.yaml +227 -0
  4. model.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - model_hub_mixin
4
+ - pytorch_model_hub_mixin
5
+ ---
6
+
7
+ This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
8
+ - Library: [More Information Needed]
9
+ - Docs: [More Information Needed]
config.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "chunk_size": 100,
3
+ "dim_feedforward": 3200,
4
+ "dim_model": 512,
5
+ "dropout": 0.1,
6
+ "feedforward_activation": "relu",
7
+ "input_normalization_modes": {
8
+ "observation.images.top": "mean_std",
9
+ "observation.state": "mean_std"
10
+ },
11
+ "input_shapes": {
12
+ "dataset_index": [
13
+ 1
14
+ ],
15
+ "observation.images.top": [
16
+ 3,
17
+ 480,
18
+ 640
19
+ ],
20
+ "observation.state": [
21
+ 14
22
+ ]
23
+ },
24
+ "kl_weight": 10.0,
25
+ "latent_dim": 32,
26
+ "n_action_steps": 100,
27
+ "n_decoder_layers": 1,
28
+ "n_encoder_layers": 4,
29
+ "n_heads": 8,
30
+ "n_obs_steps": 1,
31
+ "n_vae_encoder_layers": 4,
32
+ "output_normalization_modes": {
33
+ "action": "mean_std"
34
+ },
35
+ "output_shapes": {
36
+ "action": [
37
+ 14
38
+ ]
39
+ },
40
+ "pre_norm": false,
41
+ "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
42
+ "replace_final_stride_with_dilation": false,
43
+ "temporal_ensemble_coeff": null,
44
+ "use_vae": true,
45
+ "vision_backbone": "resnet18"
46
+ }
config.yaml ADDED
@@ -0,0 +1,227 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ resume: false
2
+ device: cuda
3
+ seed: 1000
4
+ dataset_repo_id:
5
+ - lerobot/aloha_sim_insertion_human
6
+ - lerobot/aloha_sim_transfer_cube_human
7
+ video_backend: pyav
8
+ training:
9
+ offline_steps: 100000
10
+ num_workers: 4
11
+ batch_size: 8
12
+ eval_freq: -1
13
+ log_freq: 200
14
+ save_checkpoint: true
15
+ save_freq: 20000
16
+ online_steps: 0
17
+ online_rollout_n_episodes: 1
18
+ online_rollout_batch_size: 1
19
+ online_steps_between_rollouts: 1
20
+ online_sampling_ratio: 0.5
21
+ online_env_seed: null
22
+ online_buffer_capacity: null
23
+ online_buffer_seed_size: 0
24
+ do_online_rollout_async: false
25
+ image_transforms:
26
+ enable: false
27
+ max_num_transforms: 3
28
+ random_order: false
29
+ brightness:
30
+ weight: 1
31
+ min_max:
32
+ - 0.8
33
+ - 1.2
34
+ contrast:
35
+ weight: 1
36
+ min_max:
37
+ - 0.8
38
+ - 1.2
39
+ saturation:
40
+ weight: 1
41
+ min_max:
42
+ - 0.5
43
+ - 1.5
44
+ hue:
45
+ weight: 1
46
+ min_max:
47
+ - -0.05
48
+ - 0.05
49
+ sharpness:
50
+ weight: 1
51
+ min_max:
52
+ - 0.8
53
+ - 1.2
54
+ lr: 1.0e-05
55
+ lr_backbone: 1.0e-05
56
+ weight_decay: 0.0001
57
+ grad_clip_norm: 10
58
+ delta_timestamps:
59
+ action:
60
+ - 0.0
61
+ - 0.02
62
+ - 0.04
63
+ - 0.06
64
+ - 0.08
65
+ - 0.1
66
+ - 0.12
67
+ - 0.14
68
+ - 0.16
69
+ - 0.18
70
+ - 0.2
71
+ - 0.22
72
+ - 0.24
73
+ - 0.26
74
+ - 0.28
75
+ - 0.3
76
+ - 0.32
77
+ - 0.34
78
+ - 0.36
79
+ - 0.38
80
+ - 0.4
81
+ - 0.42
82
+ - 0.44
83
+ - 0.46
84
+ - 0.48
85
+ - 0.5
86
+ - 0.52
87
+ - 0.54
88
+ - 0.56
89
+ - 0.58
90
+ - 0.6
91
+ - 0.62
92
+ - 0.64
93
+ - 0.66
94
+ - 0.68
95
+ - 0.7
96
+ - 0.72
97
+ - 0.74
98
+ - 0.76
99
+ - 0.78
100
+ - 0.8
101
+ - 0.82
102
+ - 0.84
103
+ - 0.86
104
+ - 0.88
105
+ - 0.9
106
+ - 0.92
107
+ - 0.94
108
+ - 0.96
109
+ - 0.98
110
+ - 1.0
111
+ - 1.02
112
+ - 1.04
113
+ - 1.06
114
+ - 1.08
115
+ - 1.1
116
+ - 1.12
117
+ - 1.14
118
+ - 1.16
119
+ - 1.18
120
+ - 1.2
121
+ - 1.22
122
+ - 1.24
123
+ - 1.26
124
+ - 1.28
125
+ - 1.3
126
+ - 1.32
127
+ - 1.34
128
+ - 1.36
129
+ - 1.38
130
+ - 1.4
131
+ - 1.42
132
+ - 1.44
133
+ - 1.46
134
+ - 1.48
135
+ - 1.5
136
+ - 1.52
137
+ - 1.54
138
+ - 1.56
139
+ - 1.58
140
+ - 1.6
141
+ - 1.62
142
+ - 1.64
143
+ - 1.66
144
+ - 1.68
145
+ - 1.7
146
+ - 1.72
147
+ - 1.74
148
+ - 1.76
149
+ - 1.78
150
+ - 1.8
151
+ - 1.82
152
+ - 1.84
153
+ - 1.86
154
+ - 1.88
155
+ - 1.9
156
+ - 1.92
157
+ - 1.94
158
+ - 1.96
159
+ - 1.98
160
+ eval:
161
+ n_episodes: 50
162
+ batch_size: 50
163
+ use_async_envs: false
164
+ wandb:
165
+ enable: true
166
+ disable_artifact: false
167
+ project: lerobot
168
+ notes: ''
169
+ fps: 50
170
+ env:
171
+ name: aloha
172
+ task: AlohaInsertion-v0
173
+ state_dim: 14
174
+ action_dim: 14
175
+ fps: ${fps}
176
+ episode_length: 400
177
+ gym:
178
+ obs_type: pixels_agent_pos
179
+ render_mode: rgb_array
180
+ override_dataset_stats:
181
+ observation.images.top:
182
+ mean:
183
+ - - - 0.485
184
+ - - - 0.456
185
+ - - - 0.406
186
+ std:
187
+ - - - 0.229
188
+ - - - 0.224
189
+ - - - 0.225
190
+ policy:
191
+ name: act
192
+ n_obs_steps: 1
193
+ chunk_size: 100
194
+ n_action_steps: 100
195
+ input_shapes:
196
+ observation.images.top:
197
+ - 3
198
+ - 480
199
+ - 640
200
+ observation.state:
201
+ - ${env.state_dim}
202
+ dataset_index:
203
+ - 1
204
+ output_shapes:
205
+ action:
206
+ - ${env.action_dim}
207
+ input_normalization_modes:
208
+ observation.images.top: mean_std
209
+ observation.state: mean_std
210
+ output_normalization_modes:
211
+ action: mean_std
212
+ vision_backbone: resnet18
213
+ pretrained_backbone_weights: ResNet18_Weights.IMAGENET1K_V1
214
+ replace_final_stride_with_dilation: false
215
+ pre_norm: false
216
+ dim_model: 512
217
+ n_heads: 8
218
+ dim_feedforward: 3200
219
+ feedforward_activation: relu
220
+ n_encoder_layers: 4
221
+ n_decoder_layers: 1
222
+ use_vae: true
223
+ latent_dim: 32
224
+ n_vae_encoder_layers: 4
225
+ temporal_ensemble_coeff: null
226
+ dropout: 0.1
227
+ kl_weight: 10.0
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2a517d9903e125791e571ee1165e387a16ef40779217edb2c7435809a946228
3
+ size 206772824