SondosM committed on
Commit
44b1214
·
verified ·
1 Parent(s): 989560f

Upload folder using huggingface_hub

Browse files
pretrained_models/pretrained_models/detector.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ef3df44e42d2db52d4ffe91f83a22ce9925e2acc9abebf453f2c5d22e380033
3
+ size 53582271
pretrained_models/pretrained_models/model_config.yaml ADDED
@@ -0,0 +1,119 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ task_name: train
2
+ tags:
3
+ - dev
4
+ train: true
5
+ test: false
6
+ ckpt_path: null
7
+ seed: null
8
+ DATASETS:
9
+ TRAIN:
10
+ FREIHAND-TRAIN:
11
+ WEIGHT: 0.2
12
+ INTERHAND26M-TRAIN:
13
+ WEIGHT: 0.1
14
+ MTC-TRAIN:
15
+ WEIGHT: 0.05
16
+ RHD-TRAIN:
17
+ WEIGHT: 0.05
18
+ COCOW-TRAIN:
19
+ WEIGHT: 0.05
20
+ HALPE-TRAIN:
21
+ WEIGHT: 0.05
22
+ MPIINZSL-TRAIN:
23
+ WEIGHT: 0.05
24
+ HO3D-TRAIN:
25
+ WEIGHT: 0.05
26
+ H2O3D-TRAIN:
27
+ WEIGHT: 0.05
28
+ DEX-TRAIN:
29
+ WEIGHT: 0.05
30
+ BEDLAM-TRAIN:
31
+ WEIGHT: 0.05
32
+ REINTER-TRAIN:
33
+ WEIGHT: 0.1
34
+ HOT3D-TRAIN:
35
+ WEIGHT: 0.05
36
+ ARCTIC-TRAIN:
37
+ WEIGHT: 0.1
38
+ VAL:
39
+ FREIHAND-TRAIN:
40
+ WEIGHT: 1.0
41
+ MOCAP: FREIHAND-MOCAP
42
+ BETAS_REG: true
43
+ CONFIG:
44
+ SCALE_FACTOR: 0.3
45
+ ROT_FACTOR: 30
46
+ TRANS_FACTOR: 0.02
47
+ COLOR_SCALE: 0.2
48
+ ROT_AUG_RATE: 0.6
49
+ TRANS_AUG_RATE: 0.5
50
+ DO_FLIP: false
51
+ FLIP_AUG_RATE: 0.0
52
+ EXTREME_CROP_AUG_RATE: 0.0
53
+ EXTREME_CROP_AUG_LEVEL: 1
54
+ extras:
55
+ ignore_warnings: false
56
+ enforce_tags: true
57
+ print_config: true
58
+ exp_name: WiLoR
59
+ MANO:
60
+ DATA_DIR: mano_data
61
+ MODEL_PATH: ${MANO.DATA_DIR}
62
+ GENDER: neutral
63
+ NUM_HAND_JOINTS: 15
64
+ MEAN_PARAMS: ${MANO.DATA_DIR}/mano_mean_params.npz
65
+ CREATE_BODY_POSE: false
66
+ EXTRA:
67
+ FOCAL_LENGTH: 5000
68
+ NUM_LOG_IMAGES: 4
69
+ NUM_LOG_SAMPLES_PER_IMAGE: 8
70
+ PELVIS_IND: 0
71
+ GENERAL:
72
+ TOTAL_STEPS: 1000000
73
+ LOG_STEPS: 1000
74
+ VAL_STEPS: 1000
75
+ CHECKPOINT_STEPS: 1000
76
+ CHECKPOINT_SAVE_TOP_K: 1
77
+ NUM_WORKERS: 8
78
+ PREFETCH_FACTOR: 2
79
+ TRAIN:
80
+ LR: 1.0e-05
81
+ WEIGHT_DECAY: 0.0001
82
+ BATCH_SIZE: 32
83
+ LOSS_REDUCTION: mean
84
+ NUM_TRAIN_SAMPLES: 2
85
+ NUM_TEST_SAMPLES: 64
86
+ POSE_2D_NOISE_RATIO: 0.01
87
+ SMPL_PARAM_NOISE_RATIO: 0.005
88
+ MODEL:
89
+ IMAGE_SIZE: 256
90
+ IMAGE_MEAN:
91
+ - 0.485
92
+ - 0.456
93
+ - 0.406
94
+ IMAGE_STD:
95
+ - 0.229
96
+ - 0.224
97
+ - 0.225
98
+ BACKBONE:
99
+ TYPE: vit
100
+ PRETRAINED_WEIGHTS: training_data/vitpose_backbone.pth
101
+ MANO_HEAD:
102
+ TYPE: transformer_decoder
103
+ IN_CHANNELS: 2048
104
+ TRANSFORMER_DECODER:
105
+ depth: 6
106
+ heads: 8
107
+ mlp_dim: 1024
108
+ dim_head: 64
109
+ dropout: 0.0
110
+ emb_dropout: 0.0
111
+ norm: layer
112
+ context_dim: 1280
113
+ LOSS_WEIGHTS:
114
+ KEYPOINTS_3D: 0.05
115
+ KEYPOINTS_2D: 0.01
116
+ GLOBAL_ORIENT: 0.001
117
+ HAND_POSE: 0.001
118
+ BETAS: 0.0005
119
+ ADVERSARIAL: 0.0005
pretrained_models/pretrained_models/wilor_final.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e97aafc7dd08d883a4cc5a027df61fdb6fda6136dbd1319405413862ada6bb2
3
+ size 2564989533