Spaces:
Running
on
Zero
Running
on
Zero
task_name: train | |
tags: | |
- dev | |
train: true | |
test: false | |
ckpt_path: null | |
seed: null | |
DATASETS: | |
TRAIN: | |
FREIHAND-TRAIN: | |
WEIGHT: 0.2 | |
INTERHAND26M-TRAIN: | |
WEIGHT: 0.1 | |
MTC-TRAIN: | |
WEIGHT: 0.05 | |
RHD-TRAIN: | |
WEIGHT: 0.05 | |
COCOW-TRAIN: | |
WEIGHT: 0.05 | |
HALPE-TRAIN: | |
WEIGHT: 0.05 | |
MPIINZSL-TRAIN: | |
WEIGHT: 0.05 | |
HO3D-TRAIN: | |
WEIGHT: 0.05 | |
H2O3D-TRAIN: | |
WEIGHT: 0.05 | |
DEX-TRAIN: | |
WEIGHT: 0.05 | |
BEDLAM-TRAIN: | |
WEIGHT: 0.05 | |
REINTER-TRAIN: | |
WEIGHT: 0.1 | |
HOT3D-TRAIN: | |
WEIGHT: 0.05 | |
ARCTIC-TRAIN: | |
WEIGHT: 0.1 | |
VAL: | |
FREIHAND-TRAIN: | |
WEIGHT: 1.0 | |
MOCAP: FREIHAND-MOCAP | |
BETAS_REG: true | |
CONFIG: | |
SCALE_FACTOR: 0.3 | |
ROT_FACTOR: 30 | |
TRANS_FACTOR: 0.02 | |
COLOR_SCALE: 0.2 | |
ROT_AUG_RATE: 0.6 | |
TRANS_AUG_RATE: 0.5 | |
DO_FLIP: false | |
FLIP_AUG_RATE: 0.0 | |
EXTREME_CROP_AUG_RATE: 0.0 | |
EXTREME_CROP_AUG_LEVEL: 1 | |
extras: | |
ignore_warnings: false | |
enforce_tags: true | |
print_config: true | |
exp_name: WiLoR | |
MANO: | |
DATA_DIR: mano_data | |
MODEL_PATH: ${MANO.DATA_DIR}/mano | |
GENDER: neutral | |
NUM_HAND_JOINTS: 15 | |
MEAN_PARAMS: ${MANO.DATA_DIR}/mano_mean_params.npz | |
CREATE_BODY_POSE: false | |
EXTRA: | |
FOCAL_LENGTH: 5000 | |
NUM_LOG_IMAGES: 4 | |
NUM_LOG_SAMPLES_PER_IMAGE: 8 | |
PELVIS_IND: 0 | |
GENERAL: | |
TOTAL_STEPS: 1000000 | |
LOG_STEPS: 1000 | |
VAL_STEPS: 1000 | |
CHECKPOINT_STEPS: 1000 | |
CHECKPOINT_SAVE_TOP_K: 1 | |
NUM_WORKERS: 8 | |
PREFETCH_FACTOR: 2 | |
TRAIN: | |
LR: 1.0e-05 | |
WEIGHT_DECAY: 0.0001 | |
BATCH_SIZE: 32 | |
LOSS_REDUCTION: mean | |
NUM_TRAIN_SAMPLES: 2 | |
NUM_TEST_SAMPLES: 64 | |
POSE_2D_NOISE_RATIO: 0.01 | |
SMPL_PARAM_NOISE_RATIO: 0.005 | |
MODEL: | |
IMAGE_SIZE: 256 | |
IMAGE_MEAN: | |
- 0.485 | |
- 0.456 | |
- 0.406 | |
IMAGE_STD: | |
- 0.229 | |
- 0.224 | |
- 0.225 | |
BACKBONE: | |
TYPE: vit | |
PRETRAINED_WEIGHTS: training_data/vitpose_backbone.pth | |
MANO_HEAD: | |
TYPE: transformer_decoder | |
IN_CHANNELS: 2048 | |
TRANSFORMER_DECODER: | |
depth: 6 | |
heads: 8 | |
mlp_dim: 1024 | |
dim_head: 64 | |
dropout: 0.0 | |
emb_dropout: 0.0 | |
norm: layer | |
context_dim: 1280 | |
LOSS_WEIGHTS: | |
KEYPOINTS_3D: 0.05 | |
KEYPOINTS_2D: 0.01 | |
GLOBAL_ORIENT: 0.001 | |
HAND_POSE: 0.001 | |
BETAS: 0.0005 | |
ADVERSARIAL: 0.0005 | |