Spaces:
Running
on
Zero
Running
on
Zero
| task_name: train | |
| tags: | |
| - dev | |
| train: true | |
| test: false | |
| ckpt_path: null | |
| seed: null | |
| DATASETS: | |
| TRAIN: | |
| FREIHAND-TRAIN: | |
| WEIGHT: 0.2 | |
| INTERHAND26M-TRAIN: | |
| WEIGHT: 0.1 | |
| MTC-TRAIN: | |
| WEIGHT: 0.05 | |
| RHD-TRAIN: | |
| WEIGHT: 0.05 | |
| COCOW-TRAIN: | |
| WEIGHT: 0.05 | |
| HALPE-TRAIN: | |
| WEIGHT: 0.05 | |
| MPIINZSL-TRAIN: | |
| WEIGHT: 0.05 | |
| HO3D-TRAIN: | |
| WEIGHT: 0.05 | |
| H2O3D-TRAIN: | |
| WEIGHT: 0.05 | |
| DEX-TRAIN: | |
| WEIGHT: 0.05 | |
| BEDLAM-TRAIN: | |
| WEIGHT: 0.05 | |
| REINTER-TRAIN: | |
| WEIGHT: 0.1 | |
| HOT3D-TRAIN: | |
| WEIGHT: 0.05 | |
| ARCTIC-TRAIN: | |
| WEIGHT: 0.1 | |
| VAL: | |
| FREIHAND-TRAIN: | |
| WEIGHT: 1.0 | |
| MOCAP: FREIHAND-MOCAP | |
| BETAS_REG: true | |
| CONFIG: | |
| SCALE_FACTOR: 0.3 | |
| ROT_FACTOR: 30 | |
| TRANS_FACTOR: 0.02 | |
| COLOR_SCALE: 0.2 | |
| ROT_AUG_RATE: 0.6 | |
| TRANS_AUG_RATE: 0.5 | |
| DO_FLIP: false | |
| FLIP_AUG_RATE: 0.0 | |
| EXTREME_CROP_AUG_RATE: 0.0 | |
| EXTREME_CROP_AUG_LEVEL: 1 | |
| extras: | |
| ignore_warnings: false | |
| enforce_tags: true | |
| print_config: true | |
| exp_name: WiLoR | |
| MANO: | |
| DATA_DIR: mano_data | |
| MODEL_PATH: ${MANO.DATA_DIR}/mano | |
| GENDER: neutral | |
| NUM_HAND_JOINTS: 15 | |
| MEAN_PARAMS: ${MANO.DATA_DIR}/mano_mean_params.npz | |
| CREATE_BODY_POSE: false | |
| EXTRA: | |
| FOCAL_LENGTH: 5000 | |
| NUM_LOG_IMAGES: 4 | |
| NUM_LOG_SAMPLES_PER_IMAGE: 8 | |
| PELVIS_IND: 0 | |
| GENERAL: | |
| TOTAL_STEPS: 1000000 | |
| LOG_STEPS: 1000 | |
| VAL_STEPS: 1000 | |
| CHECKPOINT_STEPS: 1000 | |
| CHECKPOINT_SAVE_TOP_K: 1 | |
| NUM_WORKERS: 8 | |
| PREFETCH_FACTOR: 2 | |
| TRAIN: | |
| LR: 1.0e-05 | |
| WEIGHT_DECAY: 0.0001 | |
| BATCH_SIZE: 32 | |
| LOSS_REDUCTION: mean | |
| NUM_TRAIN_SAMPLES: 2 | |
| NUM_TEST_SAMPLES: 64 | |
| POSE_2D_NOISE_RATIO: 0.01 | |
| SMPL_PARAM_NOISE_RATIO: 0.005 | |
| MODEL: | |
| IMAGE_SIZE: 256 | |
| IMAGE_MEAN: | |
| - 0.485 | |
| - 0.456 | |
| - 0.406 | |
| IMAGE_STD: | |
| - 0.229 | |
| - 0.224 | |
| - 0.225 | |
| BACKBONE: | |
| TYPE: vit | |
| PRETRAINED_WEIGHTS: training_data/vitpose_backbone.pth | |
| MANO_HEAD: | |
| TYPE: transformer_decoder | |
| IN_CHANNELS: 2048 | |
| TRANSFORMER_DECODER: | |
| depth: 6 | |
| heads: 8 | |
| mlp_dim: 1024 | |
| dim_head: 64 | |
| dropout: 0.0 | |
| emb_dropout: 0.0 | |
| norm: layer | |
| context_dim: 1280 | |
| LOSS_WEIGHTS: | |
| KEYPOINTS_3D: 0.05 | |
| KEYPOINTS_2D: 0.01 | |
| GLOBAL_ORIENT: 0.001 | |
| HAND_POSE: 0.001 | |
| BETAS: 0.0005 | |
| ADVERSARIAL: 0.0005 | |