ThunderVVV committed on
Commit
91208ec
·
1 Parent(s): e4b612a
droid.pth → external/droid.pth RENAMED
File without changes
wilor_detector.pt → external/wilor_detector.pt RENAMED
File without changes
hawor/checkpoints/hawor.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09ba92725cc7ed5973f2cafb7ec8cf6a6d40a967c1eba708f5c1f8d54896e593
3
+ size 3267484388
hawor/checkpoints/infiller.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30715e7e72e91d4e164bb762c7ea613dcff5448dbda5fabf40b4054e408cc5c2
3
+ size 418603497
hawor/model_config.yaml ADDED
@@ -0,0 +1,140 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ task_name: train
2
+ tags:
3
+ - dev
4
+ train: true
5
+ auto_resume: true
6
+ test: false
7
+ ckpt_path: null
8
+ seed: null
9
+ DATASETS:
10
+ SUPPRESS_KP_CONF_THRESH: 0.3
11
+ FILTER_NUM_KP: 4
12
+ FILTER_NUM_KP_THRESH: 0.0
13
+ FILTER_REPROJ_THRESH: 31000
14
+ SUPPRESS_BETAS_THRESH: 3.0
15
+ SUPPRESS_BAD_POSES: false
16
+ POSES_BETAS_SIMULTANEOUS: true
17
+ FILTER_NO_POSES: false
18
+ TRAIN:
19
+ MULTI_SET: true
20
+ HOT3D_TRAIN:
21
+ WEIGHT: 1.0
22
+ ROOT: hot3d_trainset_export
23
+ PKL: train_set_new.pkl
24
+ ARCTIC_TRAIN:
25
+ WEIGHT: 1.0
26
+ ROOT: arctic_trainset_export
27
+ PKL: train_set_new.pkl
28
+ DEXYCB_TRAIN:
29
+ WEIGHT: 1.0
30
+ ROOT: dex_ycb_trainset_export
31
+ PKL: train_set_new.pkl
32
+ HO3D_TRAIN:
33
+ WEIGHT: 1.0
34
+ ROOT: ho3d_trainset_export
35
+ PKL: train_set_new.pkl
36
+ VAL:
37
+ HOT3D_TEST:
38
+ WEIGHT: 1.0
39
+ BETAS_REG: true
40
+ CONFIG:
41
+ SCALE_FACTOR: 0.3
42
+ ROT_FACTOR: 30
43
+ TRANS_FACTOR: 0.02
44
+ COLOR_SCALE: 0.2
45
+ ROT_AUG_RATE: 0.6
46
+ TRANS_AUG_RATE: 0.5
47
+ DO_FLIP: false
48
+ FLIP_AUG_RATE: 0.0
49
+ EXTREME_CROP_AUG_RATE: 0.0
50
+ EXTREME_CROP_AUG_LEVEL: 1
51
+ trainer:
52
+ _target_: pytorch_lightning.Trainer
53
+ default_root_dir: /home/bml/.storage/mnt/v-f028498a5029402d/org/zjl/model_hand/logs/train/runs/hamer_vimo_b8_g4_4set
54
+ accelerator: gpu
55
+ devices: 4
56
+ deterministic: false
57
+ num_sanity_val_steps: 0
58
+ log_every_n_steps: 1000
59
+ val_check_interval: 0
60
+ precision: 16
61
+ max_steps: 250000
62
+ limit_val_batches: 0
63
+ paths:
64
+ root_dir: /home/bml/.storage/mnt/v-f028498a5029402d/org/zjl/model_hand
65
+ data_dir: /home/bml/.storage/mnt/v-f028498a5029402d/org/zjl/model_hand/data/
66
+ log_dir: logs/
67
+ output_dir: /home/bml/.storage/mnt/v-f028498a5029402d/org/zjl/model_hand/logs/train/runs/hamer_vimo_b8_g4_4set
68
+ work_dir: /home/bml/.storage/mnt/v-f028498a5029402d/org/zjl/model_hand
69
+ extras:
70
+ ignore_warnings: false
71
+ enforce_tags: true
72
+ print_config: true
73
+ exp_name: hamer_vimo_b8_g4_4set
74
+ MANO:
75
+ DATA_DIR: _DATA/data/
76
+ MODEL_PATH: _DATA/data//mano
77
+ GENDER: neutral
78
+ NUM_HAND_JOINTS: 15
79
+ MEAN_PARAMS: _DATA/data//mano_mean_params.npz
80
+ CREATE_BODY_POSE: false
81
+ EXTRA:
82
+ FOCAL_LENGTH: 5000
83
+ NUM_LOG_IMAGES: 4
84
+ NUM_LOG_SAMPLES_PER_IMAGE: 8
85
+ PELVIS_IND: 0
86
+ GENERAL:
87
+ TOTAL_STEPS: 250000
88
+ LOG_STEPS: 1000
89
+ VAL_STEPS: 0
90
+ CHECKPOINT_STEPS: 1000
91
+ CHECKPOINT_SAVE_TOP_K: 1
92
+ NUM_WORKERS: 25
93
+ PREFETCH_FACTOR: 2
94
+ TRAIN:
95
+ LR: 1.0e-05
96
+ WEIGHT_DECAY: 0.0001
97
+ BATCH_SIZE: 8
98
+ LOSS_REDUCTION: mean
99
+ NUM_TRAIN_SAMPLES: 2
100
+ NUM_TEST_SAMPLES: 64
101
+ POSE_2D_NOISE_RATIO: 0.01
102
+ SMPL_PARAM_NOISE_RATIO: 0.005
103
+ MODEL:
104
+ IMAGE_SIZE: 256
105
+ IMAGE_MEAN:
106
+ - 0.485
107
+ - 0.456
108
+ - 0.406
109
+ IMAGE_STD:
110
+ - 0.229
111
+ - 0.224
112
+ - 0.225
113
+ BACKBONE:
114
+ TYPE: vit
115
+ TORCH_COMPILE: 0
116
+ PRETRAINED_WEIGHTS: _DATA/hamer_ckpts/checkpoints/hamer.ckpt
117
+ MANO_HEAD:
118
+ TYPE: transformer_decoder
119
+ IN_CHANNELS: 2048
120
+ TRANSFORMER_DECODER:
121
+ depth: 6
122
+ heads: 8
123
+ mlp_dim: 1024
124
+ dim_head: 64
125
+ dropout: 0.0
126
+ emb_dropout: 0.0
127
+ norm: layer
128
+ context_dim: 1280
129
+ ST_MODULE: true
130
+ MOTION_MODULE: true
131
+ ST_HDIM: 512
132
+ MOTION_HDIM: 384
133
+ ST_NLAYER: 6
134
+ MOTION_NLAYER: 6
135
+ LOSS_WEIGHTS:
136
+ KEYPOINTS_3D: 0.05
137
+ KEYPOINTS_2D: 0.01
138
+ GLOBAL_ORIENT: 0.001
139
+ HAND_POSE: 0.001
140
+ BETAS: 0.0005