Edson125 committed on
Commit
3c10b26
·
verified ·
1 Parent(s): 5ec8257

Upload 6 files

Browse files
_DATA/data/mano/MANO_RIGHT.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45d60aa3b27ef9107a7afd4e00808f307fd91111e1cfa35afd5c4a62de264767
3
+ size 3821356
_DATA/data/mano_mean_params.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efc0ec58e4a5cef78f3abfb4e8f91623b8950be9eff8b8e0dbb0d036ebc63988
3
+ size 1178
_DATA/hamer_ckpts/checkpoints/hamer.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5cc06f294d88a92dee24e603480aab04de532b49f0e08200804ee7d90e16f53
3
+ size 2689536166
_DATA/hamer_ckpts/dataset_config.yaml ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ COCOW-TRAIN:
2
+ TYPE: ImageDataset
3
+ URLS: hamer_training_data/dataset_tars/cocow-train/{000000..000036}.tar
4
+ epoch_size: 78666
5
+ DEX-TRAIN:
6
+ TYPE: ImageDataset
7
+ URLS: hamer_training_data/dataset_tars/dex-train/{000000..000406}.tar
8
+ epoch_size: 406888
9
+ FREIHAND-MOCAP:
10
+ DATASET_FILE: hamer_training_data/freihand_mocap.npz
11
+ FREIHAND-TRAIN:
12
+ TYPE: ImageDataset
13
+ URLS: hamer_training_data/dataset_tars/freihand-train/{000000..000130}.tar
14
+ epoch_size: 130240
15
+ H2O3D-TRAIN:
16
+ TYPE: ImageDataset
17
+ URLS: hamer_training_data/dataset_tars/h2o3d-train/{000000..000060}.tar
18
+ epoch_size: 121996
19
+ HALPE-TRAIN:
20
+ TYPE: ImageDataset
21
+ URLS: hamer_training_data/dataset_tars/halpe-train/{000000..000022}.tar
22
+ epoch_size: 34289
23
+ HO3D-TRAIN:
24
+ TYPE: ImageDataset
25
+ URLS: hamer_training_data/dataset_tars/ho3d-train/{000000..000083}.tar
26
+ epoch_size: 83325
27
+ INTERHAND26M-TRAIN:
28
+ TYPE: ImageDataset
29
+ URLS: hamer_training_data/dataset_tars/interhand26m-train/{000000..001056}.tar
30
+ epoch_size: 1424632
31
+ MPIINZSL-TRAIN:
32
+ TYPE: ImageDataset
33
+ URLS: hamer_training_data/dataset_tars/mpiinzsl-train/{000000..000015}.tar
34
+ epoch_size: 15184
35
+ MTC-TRAIN:
36
+ TYPE: ImageDataset
37
+ URLS: hamer_training_data/dataset_tars/mtc-train/{000000..000306}.tar
38
+ epoch_size: 363947
39
+ RHD-TRAIN:
40
+ TYPE: ImageDataset
41
+ URLS: hamer_training_data/dataset_tars/rhd-train/{000000..000041}.tar
42
+ epoch_size: 61705
_DATA/hamer_ckpts/model_config.yaml ADDED
@@ -0,0 +1,111 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ task_name: train
2
+ tags:
3
+ - dev
4
+ train: true
5
+ test: false
6
+ ckpt_path: null
7
+ seed: null
8
+ DATASETS:
9
+ TRAIN:
10
+ FREIHAND-TRAIN:
11
+ WEIGHT: 0.25
12
+ INTERHAND26M-TRAIN:
13
+ WEIGHT: 0.25
14
+ MTC-TRAIN:
15
+ WEIGHT: 0.1
16
+ RHD-TRAIN:
17
+ WEIGHT: 0.05
18
+ COCOW-TRAIN:
19
+ WEIGHT: 0.1
20
+ HALPE-TRAIN:
21
+ WEIGHT: 0.05
22
+ MPIINZSL-TRAIN:
23
+ WEIGHT: 0.05
24
+ HO3D-TRAIN:
25
+ WEIGHT: 0.05
26
+ H2O3D-TRAIN:
27
+ WEIGHT: 0.05
28
+ DEX-TRAIN:
29
+ WEIGHT: 0.05
30
+ VAL:
31
+ FREIHAND-TRAIN:
32
+ WEIGHT: 1.0
33
+ MOCAP: FREIHAND-MOCAP
34
+ BETAS_REG: true
35
+ CONFIG:
36
+ SCALE_FACTOR: 0.3
37
+ ROT_FACTOR: 30
38
+ TRANS_FACTOR: 0.02
39
+ COLOR_SCALE: 0.2
40
+ ROT_AUG_RATE: 0.6
41
+ TRANS_AUG_RATE: 0.5
42
+ DO_FLIP: false
43
+ FLIP_AUG_RATE: 0.0
44
+ EXTREME_CROP_AUG_RATE: 0.0
45
+ EXTREME_CROP_AUG_LEVEL: 1
46
+ extras:
47
+ ignore_warnings: false
48
+ enforce_tags: true
49
+ print_config: true
50
+ exp_name: hamer
51
+ MANO:
52
+ DATA_DIR: _DATA/data/
53
+ MODEL_PATH: data/mano
54
+ GENDER: neutral
55
+ NUM_HAND_JOINTS: 15
56
+ MEAN_PARAMS: data/mano_mean_params.npz
57
+ CREATE_BODY_POSE: false
58
+ EXTRA:
59
+ FOCAL_LENGTH: 5000
60
+ NUM_LOG_IMAGES: 4
61
+ NUM_LOG_SAMPLES_PER_IMAGE: 8
62
+ PELVIS_IND: 0
63
+ GENERAL:
64
+ TOTAL_STEPS: 1000000
65
+ LOG_STEPS: 1000
66
+ VAL_STEPS: 1000
67
+ CHECKPOINT_STEPS: 10000
68
+ CHECKPOINT_SAVE_TOP_K: 1
69
+ NUM_WORKERS: 8
70
+ PREFETCH_FACTOR: 2
71
+ TRAIN:
72
+ LR: 1.0e-05
73
+ WEIGHT_DECAY: 0.0001
74
+ BATCH_SIZE: 32
75
+ LOSS_REDUCTION: mean
76
+ NUM_TRAIN_SAMPLES: 2
77
+ NUM_TEST_SAMPLES: 64
78
+ POSE_2D_NOISE_RATIO: 0.01
79
+ SMPL_PARAM_NOISE_RATIO: 0.005
80
+ MODEL:
81
+ IMAGE_SIZE: 256
82
+ IMAGE_MEAN:
83
+ - 0.485
84
+ - 0.456
85
+ - 0.406
86
+ IMAGE_STD:
87
+ - 0.229
88
+ - 0.224
89
+ - 0.225
90
+ BACKBONE:
91
+ TYPE: vit
92
+ PRETRAINED_WEIGHTS: hamer_training_data/vitpose_backbone.pth
93
+ MANO_HEAD:
94
+ TYPE: transformer_decoder
95
+ IN_CHANNELS: 2048
96
+ TRANSFORMER_DECODER:
97
+ depth: 6
98
+ heads: 8
99
+ mlp_dim: 1024
100
+ dim_head: 64
101
+ dropout: 0.0
102
+ emb_dropout: 0.0
103
+ norm: layer
104
+ context_dim: 1280
105
+ LOSS_WEIGHTS:
106
+ KEYPOINTS_3D: 0.05
107
+ KEYPOINTS_2D: 0.01
108
+ GLOBAL_ORIENT: 0.001
109
+ HAND_POSE: 0.001
110
+ BETAS: 0.0005
111
+ ADVERSARIAL: 0.0005
_DATA/vitpose_ckpts/vitpose+_huge/wholebody.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0555e1e2392e6a2be2d9265368f344d70ccbfd656ad480aa5c1de2e604519c9
3
+ size 3807742341