# Page header captured together with this file (not part of the config):
#   author: carohiguera
#   commit: ebd4d0b - "added force field decoder for gelsight"
#   size:   4.2 kB
# Filesystem locations. Other entries in this file read them through
# ${paths.data_root}, ${paths.encoder_checkpoint_root} and ${paths.output_dir},
# so these keys must be nested under `paths` for the interpolations to resolve.
# NOTE(review): all values are absolute, machine-specific mount points; adjust
# them before running on another host.
paths:
  # NOTE(review): both roots end in "/" while the references further down
  # append "/..." (e.g. ${paths.data_root}/datasets/...), so the resolved
  # strings contain "//". Presumably harmless on POSIX - verify.
  data_root: /media/chiguera/GUM/
  encoder_checkpoint_root: /media/chiguera/2TB/sparsh/encoders_460k/
  log_dir: /media/chiguera/GUM/tactile_ssl/outputs_sparsh/${experiment_name}/logs/
  output_dir: /media/chiguera/GUM/tactile_ssl/outputs_sparsh/${experiment_name}/
  # Resolved by Hydra's `hydra:` resolver at runtime.
  work_dir: ${hydra:runtime.cwd}
# Experiment-tracking settings (presumably Weights & Biases, going by the key
# name - confirm against the consumer). Every value except `entity` is either
# interpolated from keys defined elsewhere in this file or left null.
wandb:
  # Built from the top-level `task_name` and `sensor` keys.
  project: ${task_name}_${sensor}
  entity: chiguera
  save_dir: ${paths.output_dir}
  # Combines the Hydra job id with the top-level `experiment_name`.
  id: ${hydra:job.id}_${experiment_name}
  tags:
    - ${ssl_name}
  group: null
  notes: null
# Dataset selection, preprocessing and dataloader settings.
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been stripped. `sensor` directly under `data` is confirmed by
# the ${data.sensor} reference; placing the two dataloader sections under
# `data` (rather than at top level) is an assumption - confirm against the
# code that reads this config.
data:
  train_val_split: null
  # Forwarded from the top-level keys of the same name.
  train_data_budget: ${train_data_budget}
  val_data_budget: ${val_data_budget}
  max_train_data: null
  # Read back below as ${data.sensor}. Note that it differs from the
  # top-level `sensor` key (gelsight) used for naming the experiment.
  sensor: gelsight_mini
  dataset:
    # `_target_` names the class Hydra instantiates for this node.
    _target_: tactile_ssl.data.vision_tactile_forcefield.VisionTactileBackboneDataset
    config:
      sensor: ${data.sensor}
      remove_bg: true
      out_format: concat_ch_img
      num_frames: 2
      frame_stride: 5
      path_dataset: ${paths.data_root}/datasets/gelsight/Object-Slide/
      path_bgs: ${paths.data_root}/datasets/gelsight/Object-Slide/bgs/
      # dataset_0..dataset_2 for each of eight objects.
      list_datasets:
        - strawberry/dataset_0
        - strawberry/dataset_1
        - strawberry/dataset_2
        - plum/dataset_0
        - plum/dataset_1
        - plum/dataset_2
        - icecream_cup/dataset_0
        - icecream_cup/dataset_1
        - icecream_cup/dataset_2
        - donut/dataset_0
        - donut/dataset_1
        - donut/dataset_2
        - cookie2/dataset_0
        - cookie2/dataset_1
        - cookie2/dataset_2
        - bread/dataset_0
        - bread/dataset_1
        - bread/dataset_2
        - banana/dataset_0
        - banana/dataset_1
        - banana/dataset_2
        - bagel/dataset_0
        - bagel/dataset_1
        - bagel/dataset_2
      # dataset_3 of the same eight objects; none of these appear in
      # `list_datasets` above.
      list_datasets_test:
        - bagel/dataset_3
        - banana/dataset_3
        - bread/dataset_3
        - cookie2/dataset_3
        - donut/dataset_3
        - icecream_cup/dataset_3
        - plum/dataset_3
        - strawberry/dataset_3
      look_in_folder: false
      transforms:
        # Augmentation is switched off and every p_* probability is 0.0.
        with_augmentation: false
        resize: [224, 224]
        p_flip: 0.0
        p_crop: 0.0
        p_rot: 0.0
  train_dataloader:
    batch_size: 20
    num_workers: 2
    drop_last: true
    pin_memory: true
    persistent_workers: true
    shuffle: true
  # Same settings as the training loader, except that no `shuffle` key is set.
  val_dataloader:
    batch_size: 20
    num_workers: 2
    drop_last: true
    pin_memory: true
    persistent_workers: true
# Downstream force-field task: encoder, decoder, checkpoints and optimizer.
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been stripped. Placing the checkpoint/optimizer/ssl_config
# keys directly under `task` (not under `model_task`) and `encoder_type` under
# `task` (not under `ssl_config.loss` or at top level) are assumptions -
# confirm against the constructor of the `_target_` class.
task:
  _target_: tactile_ssl.downstream_task.ForceFieldModuleSL
  model_encoder:
    # Resolves to tactile_ssl.model.vit_base with the current ssl_model_size.
    _target_: tactile_ssl.model.vit_${ssl_model_size}
    img_size: [224, 224]
    # Presumably 2 frames x 3 channels, matching num_frames: 2 and
    # out_format: concat_ch_img in the dataset config - TODO confirm.
    in_chans: 6
    pos_embed_fn: sinusoidal
    num_register_tokens: 1
  model_task:
    _target_: tactile_ssl.downstream_task.ForceFieldDecoderSL
    # NOTE(review): this resolves to the string "base", not a number;
    # presumably the decoder maps size names to widths - verify.
    embed_dim: ${ssl_model_size}
  checkpoint_encoder: ${paths.encoder_checkpoint_root}/${ssl_name}_vit${ssl_model_size}.ckpt
  # NOTE(review): this path points at a "digit_..." run directory although the
  # sensor configured in this file is gelsight / gelsight_mini. Confirm that
  # starting from a DIGIT decoder checkpoint is intended.
  checkpoint_task: /media/chiguera/GUM/tactile_ssl/outputs_sparsh/digit_t1_forcefield_dino_vitbase_bg/checkpoints/epoch-0031.pth
  train_encoder: false
  optim_cfg:
    # `_partial_: true` makes Hydra return a partially-applied callable, so
    # remaining arguments are supplied by the caller.
    _partial_: true
    _target_: torch.optim.Adam
    lr: 0.0001
  scheduler_cfg: null
  ssl_config:
    img_sz: [224, 224]
    pose_estimator:
      num_encoder_layers: 18
    loss:
      with_mask_supervision: false
      with_sl_supervision: false
      with_ssim: true
      disparity_smoothness: 0.001
      min_depth: 0.1
      max_depth: 100.0
  encoder_type: ${ssl_name}
# ---- Experiment identity --------------------------------------------------
# These top-level scalars are interpolated throughout the file
# (e.g. ${ssl_name}, ${sensor}, ${task_name}, ${ssl_model_size}).
sensor: gelsight
task_name: t1_forcefield
ssl_name: dino
ssl_model_size: base
# Resolves to gelsight_t1_forcefield_dino_vitbase_bg with the values above.
experiment_name: ${sensor}_${task_name}_${ssl_name}_vit${ssl_model_size}_bg

# ---- Run control ----------------------------------------------------------
seed: 42
ckpt_path: null

# ---- Data budgets (read via ${train_data_budget} / ${val_data_budget}) -----
train_data_budget: 1.0
val_data_budget: 1.0

# ---- Input format ---------------------------------------------------------
# These literals repeat the values of out_format / num_frames / frame_stride
# in the dataset config; nothing visible in this file interpolates them, so
# keep both places in sync when editing.
data_out_format: concat_ch_img
num_frames: 2
frame_stride: 5
# Training-loop settings.
# NOTE(review): nesting reconstructed from a copy without indentation; all
# keys up to and including `devices` are assumed to belong to `trainer`.
trainer:
  max_epochs: 21
  # Units are not stated here (presumably epochs) - confirm in the trainer.
  validation_frequency: 2
  sanity_validate: false
  save_checkpoint_dir: ${paths.output_dir}/checkpoints
  checkpoint_interval_type: log
  max_task_checkpoints: 10
  save_probe_weights_only: true
  limit_train_batches: 500
  limit_val_batches: 150
  use_distributed_sampler: false
  devices: [0]
# Evaluation / demo settings.
# NOTE(review): nesting reconstructed from a copy without indentation.
# `path_outputs` is placed directly under `test`; it could instead belong to
# `demo` - confirm against the code that reads this section.
test:
  data:
    # NOTE(review): cookie2/dataset_0 also appears in the training list
    # (data.dataset.config.list_datasets); confirm that evaluating on a
    # training recording is intended.
    dataset_name:
      - cookie2/dataset_0
    batch_size: 1
  tester:
    # `_partial_: true` yields a partially-applied callable; the remaining
    # arguments are supplied by the caller.
    _partial_: true
    _target_: tactile_ssl.test.TestForceField
  demo:
    _partial_: true
    _target_: tactile_ssl.test.DemoForceField
  path_outputs: null