Ceveloper
committed on
Commit
·
98f391d
1
Parent(s):
449ae80
Models uploaded
Browse files
- trained_models/hmp/amass-mano/autoencoder/checkpoints/cvpr_release.pt +3 -0
- trained_models/hmp/amass-mano/autoencoder/config.yaml +113 -0
- trained_models/hmp/amass-mano/diffusion/checkpoints/cvpr_release.pt +3 -0
- trained_models/hmp/amass-mano/diffusion/config.yaml +56 -0
- trained_models/hmp/amass/autoencoder/checkpoints/cvpr_release.pt +3 -0
- trained_models/hmp/amass/autoencoder/config.yaml +114 -0
- trained_models/hmp/amass/diffusion/checkpoints/cvpr_release.pt +3 -0
- trained_models/hmp/amass/diffusion/config.yaml +56 -0
- trained_models/hmp/freeman/autoencoder/checkpoints/cvpr_release.pt +3 -0
- trained_models/hmp/freeman/autoencoder/config.yaml +87 -0
- trained_models/hmp/freeman/diffusion/checkpoints/cvpr_release.pt +3 -0
- trained_models/hmp/freeman/diffusion/config.yaml +56 -0
- trained_models/hmp/h36m/autoencoder/checkpoints/cvpr_release.pt +3 -0
- trained_models/hmp/h36m/autoencoder/config.yaml +102 -0
- trained_models/hmp/h36m/diffusion/checkpoints/cvpr_release.pt +3 -0
- trained_models/hmp/h36m/diffusion/config.yaml +56 -0
trained_models/hmp/amass-mano/autoencoder/checkpoints/cvpr_release.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b9cf7d9ea512af8d82779a835f25a0b1f8d3e11d73b37d732ff97936b8bc12a
|
| 3 |
+
size 111366357
|
trained_models/hmp/amass-mano/autoencoder/config.yaml
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
dataset_main_path: ./datasets
|
| 2 |
+
dataset_annotation_path: ./datasets/annotations
|
| 3 |
+
dataset_precomputed_path: ./datasets/processed
|
| 4 |
+
resume_training: false
|
| 5 |
+
device: cuda
|
| 6 |
+
load: false
|
| 7 |
+
load_path: ''
|
| 8 |
+
output_log_path: ./trained_models/hmp/amass-mano/autoencoder
|
| 9 |
+
batch_size: 64
|
| 10 |
+
batch_size_eval: 512
|
| 11 |
+
if_run_validation: False
|
| 12 |
+
eval_frequency: 25
|
| 13 |
+
num_epochs: 300
|
| 14 |
+
num_iteration_eval: 10
|
| 15 |
+
num_workers: 4
|
| 16 |
+
seed: 52345
|
| 17 |
+
use_lr_scheduler: true
|
| 18 |
+
lr_scheduler_kwargs:
|
| 19 |
+
lr_scheduler_type: ExponentialLRSchedulerWarmup
|
| 20 |
+
warmup_duration: 10
|
| 21 |
+
update_every: 1
|
| 22 |
+
min_lr: 0.0001
|
| 23 |
+
gamma_decay: 0.98
|
| 24 |
+
loss_pose_type: l1
|
| 25 |
+
lr: 0.005
|
| 26 |
+
latent_size: 96
|
| 27 |
+
output_size: 3
|
| 28 |
+
z_activation: tanh
|
| 29 |
+
num_iter_perepoch: 580
|
| 30 |
+
obs_length: 30
|
| 31 |
+
prediction_horizon_train: 120
|
| 32 |
+
prediction_horizon_eval: 120
|
| 33 |
+
prediction_horizon: 120
|
| 34 |
+
pred_length: 120
|
| 35 |
+
prediction_horizon_train_min: 10
|
| 36 |
+
prediction_horizon_train_min_from_epoch: 200
|
| 37 |
+
curriculum_it: 10
|
| 38 |
+
random_prediction_horizon: true
|
| 39 |
+
if_consider_hip: false
|
| 40 |
+
history_sec: 0.5
|
| 41 |
+
prediction_horizon_sec: 2
|
| 42 |
+
motion_repr_type: SkeletonRescalePose
|
| 43 |
+
pose_box_size: 1.2
|
| 44 |
+
seq_centering: 0
|
| 45 |
+
task_name: hmp
|
| 46 |
+
num_joints: 52
|
| 47 |
+
fps: 60
|
| 48 |
+
multimodal_threshold: 0.4
|
| 49 |
+
dataset_type: AMASSDataset
|
| 50 |
+
dataset_name: amass-mano
|
| 51 |
+
precomputed_folder: ./datasets/processed/AMASS-MANO/hmp
|
| 52 |
+
annotations_folder: ./datasets/annotations/AMASS-MANO/hmp
|
| 53 |
+
dtype: float32
|
| 54 |
+
data_loader_train:
|
| 55 |
+
stride: 60
|
| 56 |
+
augmentation: 30
|
| 57 |
+
shuffle: true
|
| 58 |
+
datasets:
|
| 59 |
+
- ACCAD
|
| 60 |
+
- BMLhandball
|
| 61 |
+
- BMLmovi
|
| 62 |
+
- BMLrub
|
| 63 |
+
- EKUT
|
| 64 |
+
- CMU
|
| 65 |
+
- EyesJapanDataset
|
| 66 |
+
- KIT
|
| 67 |
+
- PosePrior
|
| 68 |
+
- TCDHands
|
| 69 |
+
- TotalCapture
|
| 70 |
+
da_mirroring: 0.5
|
| 71 |
+
da_rotations: 1.0
|
| 72 |
+
drop_last: true
|
| 73 |
+
if_load_mmgt: false
|
| 74 |
+
data_loader_train_eval:
|
| 75 |
+
stride: 30
|
| 76 |
+
augmentation: 0
|
| 77 |
+
shuffle: false
|
| 78 |
+
datasets:
|
| 79 |
+
- ACCAD
|
| 80 |
+
- BMLhandball
|
| 81 |
+
- BMLmovi
|
| 82 |
+
- BMLrub
|
| 83 |
+
- EKUT
|
| 84 |
+
- CMU
|
| 85 |
+
- EyesJapanDataset
|
| 86 |
+
- KIT
|
| 87 |
+
- PosePrior
|
| 88 |
+
- TCDHands
|
| 89 |
+
- TotalCapture
|
| 90 |
+
da_mirroring: 0.0
|
| 91 |
+
da_rotations: 0.0
|
| 92 |
+
drop_last: false
|
| 93 |
+
if_load_mmgt: false
|
| 94 |
+
data_loader_valid:
|
| 95 |
+
stride: 30
|
| 96 |
+
augmentation: 0
|
| 97 |
+
shuffle: false
|
| 98 |
+
datasets:
|
| 99 |
+
- HumanEva
|
| 100 |
+
- HDM05
|
| 101 |
+
- SFU
|
| 102 |
+
- MoSh
|
| 103 |
+
file_idces: all
|
| 104 |
+
drop_last: false
|
| 105 |
+
if_load_mmgt: false
|
| 106 |
+
|
| 107 |
+
autoenc_arch:
|
| 108 |
+
enc_num_layers: 2
|
| 109 |
+
encoder_hidden_size: 96
|
| 110 |
+
decoder_hidden_size: 96
|
| 111 |
+
arch: AutoEncoder
|
| 112 |
+
recurrent_arch_enc: StaticGraphGRU
|
| 113 |
+
recurrent_arch_decoder: StaticGraphGRU
|
trained_models/hmp/amass-mano/diffusion/checkpoints/cvpr_release.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a894bd0f79fa0accf46a6dd0e2686c47d2bc6796c03f0277b187a8cef12855e
|
| 3 |
+
size 394796990
|
trained_models/hmp/amass-mano/diffusion/config.yaml
ADDED
|
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
if_resume_training: false
|
| 2 |
+
device: cuda
|
| 3 |
+
load: false
|
| 4 |
+
load_path: ''
|
| 5 |
+
dataset_main_path: ./datasets
|
| 6 |
+
dataset_annotation_path: ./datasets/annotations
|
| 7 |
+
dataset_precomputed_path: ./datasets/processed
|
| 8 |
+
output_log_path: ./trained_models/hmp/amass-mano/diffusion
|
| 9 |
+
pretrained_autoencoder_path: ./trained_models/hmp/amass-mano/autoencoder/checkpoints/cvpr_release.pt
|
| 10 |
+
lr: 0.001
|
| 11 |
+
diffusion_objective: pred_x0
|
| 12 |
+
weight_decay: 0.0
|
| 13 |
+
if_use_ema: true
|
| 14 |
+
step_start_ema: 100
|
| 15 |
+
ema_power: 0.6666666666666666
|
| 16 |
+
ema_update_every: 10
|
| 17 |
+
ema_min_value: 0.0
|
| 18 |
+
use_lr_scheduler: true
|
| 19 |
+
lr_scheduler_kwargs:
|
| 20 |
+
lr_scheduler_type: ExponentialLRSchedulerWarmup
|
| 21 |
+
warmup_duration: 75
|
| 22 |
+
update_every: 2
|
| 23 |
+
min_lr: 0.0001
|
| 24 |
+
gamma_decay: 0.98
|
| 25 |
+
diffusion_conditioning: true
|
| 26 |
+
num_epochs: 150
|
| 27 |
+
num_workers: 4
|
| 28 |
+
batch_size: 64
|
| 29 |
+
batch_size_eval: 256
|
| 30 |
+
eval_frequency: 25
|
| 31 |
+
train_pick_best_sample_among_k: 50
|
| 32 |
+
similarity_space: input_space
|
| 33 |
+
diffusion_activation: identity
|
| 34 |
+
num_prob_samples: 50
|
| 35 |
+
diffusion_timesteps: 10
|
| 36 |
+
diffusion_type: NonisotropicGaussianDiffusion
|
| 37 |
+
diffusion_loss_type: snr
|
| 38 |
+
loss_reduction_type: l1
|
| 39 |
+
if_run_as_isotropic: false
|
| 40 |
+
if_sigma_n_scale: true
|
| 41 |
+
diffusion_covariance_type: skeleton-diffusion
|
| 42 |
+
gamma_scheduler: cosine
|
| 43 |
+
beta_schedule: cosine
|
| 44 |
+
sigma_n_scale: spectral
|
| 45 |
+
num_iter_perepoch: null
|
| 46 |
+
seed: 63485
|
| 47 |
+
diffusion_arch:
|
| 48 |
+
arch: Denoiser
|
| 49 |
+
use_attention: true
|
| 50 |
+
self_condition: false
|
| 51 |
+
norm_type: none
|
| 52 |
+
depth: 4
|
| 53 |
+
attn_dim_head: 32
|
| 54 |
+
attn_heads: 8
|
| 55 |
+
learn_influence: true
|
| 56 |
+
covariance_matrix_type: adjacency
|
trained_models/hmp/amass/autoencoder/checkpoints/cvpr_release.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f206a4108ce6ba1beec3f3e70f6b6092fb02a57c48f6c4b462a5d366d9518c5
|
| 3 |
+
size 33673173
|
trained_models/hmp/amass/autoencoder/config.yaml
ADDED
|
@@ -0,0 +1,114 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
dataset_main_path: ./datasets
|
| 2 |
+
dataset_annotation_path: ./datasets/annotations
|
| 3 |
+
dataset_precomputed_path: ./datasets/processed
|
| 4 |
+
resume_training: false
|
| 5 |
+
device: cuda
|
| 6 |
+
load: false
|
| 7 |
+
load_path: ''
|
| 8 |
+
output_log_path: ./trained_models/hmp/amass/autoencoder
|
| 9 |
+
batch_size: 64
|
| 10 |
+
batch_size_eval: 512
|
| 11 |
+
if_run_validation: False
|
| 12 |
+
eval_frequency: 25
|
| 13 |
+
num_epochs: 300
|
| 14 |
+
num_iteration_eval: 10
|
| 15 |
+
num_workers: 4
|
| 16 |
+
seed: 52345
|
| 17 |
+
use_lr_scheduler: true
|
| 18 |
+
lr_scheduler_kwargs:
|
| 19 |
+
lr_scheduler_type: ExponentialLRSchedulerWarmup
|
| 20 |
+
warmup_duration: 10
|
| 21 |
+
update_every: 1
|
| 22 |
+
min_lr: 0.0001
|
| 23 |
+
gamma_decay: 0.98
|
| 24 |
+
loss_pose_type: l1
|
| 25 |
+
lr: 0.005
|
| 26 |
+
latent_size: 96
|
| 27 |
+
output_size: 3
|
| 28 |
+
z_activation: tanh
|
| 29 |
+
num_iter_perepoch: 580
|
| 30 |
+
obs_length: 30
|
| 31 |
+
prediction_horizon_train: 120
|
| 32 |
+
prediction_horizon_eval: 120
|
| 33 |
+
prediction_horizon: 120
|
| 34 |
+
pred_length: 120
|
| 35 |
+
prediction_horizon_train_min: 10
|
| 36 |
+
prediction_horizon_train_min_from_epoch: 200
|
| 37 |
+
curriculum_it: 10
|
| 38 |
+
random_prediction_horizon: true
|
| 39 |
+
if_consider_hip: false
|
| 40 |
+
history_sec: 0.5
|
| 41 |
+
prediction_horizon_sec: 2
|
| 42 |
+
motion_repr_type: SkeletonRescalePose
|
| 43 |
+
pose_box_size: 1.2
|
| 44 |
+
seq_centering: 0
|
| 45 |
+
task_name: hmp
|
| 46 |
+
num_joints: 22
|
| 47 |
+
fps: 60
|
| 48 |
+
multimodal_threshold: 0.4
|
| 49 |
+
dataset_type: AMASSDataset
|
| 50 |
+
dataset_name: amass
|
| 51 |
+
precomputed_folder: ./datasets/processed/AMASS/hmp
|
| 52 |
+
annotations_folder: ./datasets/annotations/AMASS/hmp
|
| 53 |
+
dtype: float32
|
| 54 |
+
data_loader_train:
|
| 55 |
+
stride: 60
|
| 56 |
+
augmentation: 30
|
| 57 |
+
shuffle: true
|
| 58 |
+
datasets:
|
| 59 |
+
- ACCAD
|
| 60 |
+
- BMLhandball
|
| 61 |
+
- BMLmovi
|
| 62 |
+
- BMLrub
|
| 63 |
+
- EKUT
|
| 64 |
+
- CMU
|
| 65 |
+
- EyesJapanDataset
|
| 66 |
+
- KIT
|
| 67 |
+
- PosePrior
|
| 68 |
+
- TCDHands
|
| 69 |
+
- TotalCapture
|
| 70 |
+
da_mirroring: 0.5
|
| 71 |
+
da_rotations: 1.0
|
| 72 |
+
drop_last: true
|
| 73 |
+
if_load_mmgt: false
|
| 74 |
+
data_loader_train_eval:
|
| 75 |
+
stride: 30
|
| 76 |
+
augmentation: 0
|
| 77 |
+
shuffle: false
|
| 78 |
+
datasets:
|
| 79 |
+
- ACCAD
|
| 80 |
+
- BMLhandball
|
| 81 |
+
- BMLmovi
|
| 82 |
+
- BMLrub
|
| 83 |
+
- EKUT
|
| 84 |
+
- CMU
|
| 85 |
+
- EyesJapanDataset
|
| 86 |
+
- KIT
|
| 87 |
+
- PosePrior
|
| 88 |
+
- TCDHands
|
| 89 |
+
- TotalCapture
|
| 90 |
+
da_mirroring: 0.0
|
| 91 |
+
da_rotations: 0.0
|
| 92 |
+
drop_last: false
|
| 93 |
+
if_load_mmgt: false
|
| 94 |
+
data_loader_valid:
|
| 95 |
+
stride: 30
|
| 96 |
+
augmentation: 0
|
| 97 |
+
shuffle: false
|
| 98 |
+
datasets:
|
| 99 |
+
- HumanEva
|
| 100 |
+
- HDM05
|
| 101 |
+
- SFU
|
| 102 |
+
- MoSh
|
| 103 |
+
file_idces: all
|
| 104 |
+
drop_last: false
|
| 105 |
+
if_load_mmgt: false
|
| 106 |
+
|
| 107 |
+
autoenc_arch:
|
| 108 |
+
enc_num_layers: 2
|
| 109 |
+
encoder_hidden_size: 96
|
| 110 |
+
decoder_hidden_size: 96
|
| 111 |
+
arch: AutoEncoder
|
| 112 |
+
recurrent_arch_enc: StaticGraphGRU
|
| 113 |
+
recurrent_arch_decoder: StaticGraphGRU
|
| 114 |
+
|
trained_models/hmp/amass/diffusion/checkpoints/cvpr_release.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3412e0e99ec21641342a9997b6fdf1f9cd37211cdd79479a43a81ffd1e9820ec
|
| 3 |
+
size 643415447
|
trained_models/hmp/amass/diffusion/config.yaml
ADDED
|
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
if_resume_training: false
|
| 2 |
+
device: cuda
|
| 3 |
+
load: false
|
| 4 |
+
load_path: ''
|
| 5 |
+
dataset_main_path: ./datasets
|
| 6 |
+
dataset_annotation_path: ./datasets/annotations
|
| 7 |
+
dataset_precomputed_path: ./datasets/processed
|
| 8 |
+
output_log_path: ./trained_models/hmp/amass/diffusion
|
| 9 |
+
pretrained_autoencoder_path: ./trained_models/hmp/amass/autoencoder/checkpoints/cvpr_release.pt
|
| 10 |
+
lr: 0.001
|
| 11 |
+
diffusion_objective: pred_x0
|
| 12 |
+
weight_decay: 0.0
|
| 13 |
+
if_use_ema: true
|
| 14 |
+
step_start_ema: 100
|
| 15 |
+
ema_power: 0.6666666666666666
|
| 16 |
+
ema_update_every: 10
|
| 17 |
+
ema_min_value: 0.0
|
| 18 |
+
use_lr_scheduler: true
|
| 19 |
+
lr_scheduler_kwargs:
|
| 20 |
+
lr_scheduler_type: ExponentialLRSchedulerWarmup
|
| 21 |
+
warmup_duration: 75
|
| 22 |
+
update_every: 2
|
| 23 |
+
min_lr: 0.0001
|
| 24 |
+
gamma_decay: 0.98
|
| 25 |
+
diffusion_conditioning: true
|
| 26 |
+
num_epochs: 150
|
| 27 |
+
num_workers: 4
|
| 28 |
+
batch_size: 64
|
| 29 |
+
batch_size_eval: 256
|
| 30 |
+
eval_frequency: 25
|
| 31 |
+
train_pick_best_sample_among_k: 50
|
| 32 |
+
similarity_space: input_space
|
| 33 |
+
diffusion_activation: identity
|
| 34 |
+
num_prob_samples: 50
|
| 35 |
+
diffusion_timesteps: 10
|
| 36 |
+
diffusion_type: NonisotropicGaussianDiffusion
|
| 37 |
+
diffusion_loss_type: snr
|
| 38 |
+
loss_reduction_type: l1
|
| 39 |
+
if_run_as_isotropic: false
|
| 40 |
+
if_sigma_n_scale: true
|
| 41 |
+
diffusion_covariance_type: skeleton-diffusion
|
| 42 |
+
gamma_scheduler: cosine
|
| 43 |
+
beta_schedule: cosine
|
| 44 |
+
sigma_n_scale: spectral
|
| 45 |
+
num_iter_perepoch: null
|
| 46 |
+
seed: 63485
|
| 47 |
+
diffusion_arch:
|
| 48 |
+
arch: Denoiser
|
| 49 |
+
use_attention: true
|
| 50 |
+
self_condition: false
|
| 51 |
+
norm_type: none
|
| 52 |
+
depth: 4
|
| 53 |
+
attn_dim_head: 32
|
| 54 |
+
attn_heads: 8
|
| 55 |
+
learn_influence: true
|
| 56 |
+
covariance_matrix_type: adjacency
|
trained_models/hmp/freeman/autoencoder/checkpoints/cvpr_release.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8684cae605f16ec84bbad6e290c44b543fa88d76b39df4a851cbf8a99e9d5f91
|
| 3 |
+
size 15273931
|
trained_models/hmp/freeman/autoencoder/config.yaml
ADDED
|
@@ -0,0 +1,87 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
dataset_main_path: ./datasets
|
| 2 |
+
dataset_annotation_path: ./datasets/annotations
|
| 3 |
+
dataset_precomputed_path: ./datasets/processed
|
| 4 |
+
if_resume_training: false
|
| 5 |
+
device: cuda
|
| 6 |
+
load: false
|
| 7 |
+
load_path: ''
|
| 8 |
+
output_log_path: ./trained_models/hmp/freeman/autoencoder
|
| 9 |
+
batch_size: 64
|
| 10 |
+
batch_size_eval: 512
|
| 11 |
+
if_run_validation: False
|
| 12 |
+
eval_frequency: 25
|
| 13 |
+
num_epochs: 200
|
| 14 |
+
num_iteration_eval: 10
|
| 15 |
+
num_workers: 4
|
| 16 |
+
seed: 52345
|
| 17 |
+
use_lr_scheduler: true
|
| 18 |
+
lr_scheduler_kwargs:
|
| 19 |
+
lr_scheduler_type: ExponentialLRSchedulerWarmup
|
| 20 |
+
warmup_duration: 10
|
| 21 |
+
update_every: 1
|
| 22 |
+
min_lr: 0.0001
|
| 23 |
+
gamma_decay: 0.98
|
| 24 |
+
loss_pose_type: l1
|
| 25 |
+
lr: 0.005
|
| 26 |
+
latent_size: 96
|
| 27 |
+
output_size: 3
|
| 28 |
+
z_activation: tanh
|
| 29 |
+
num_iter_perepoch: 580
|
| 30 |
+
obs_length: 15
|
| 31 |
+
prediction_horizon_train: 60
|
| 32 |
+
prediction_horizon_eval: 60
|
| 33 |
+
prediction_horizon: 60
|
| 34 |
+
pred_length: 60
|
| 35 |
+
prediction_horizon_train_min: 10
|
| 36 |
+
prediction_horizon_train_min_from_epoch: 200
|
| 37 |
+
curriculum_it: 10
|
| 38 |
+
random_prediction_horizon: true
|
| 39 |
+
if_consider_hip: false
|
| 40 |
+
history_sec: 0.5
|
| 41 |
+
prediction_horizon_sec: 2
|
| 42 |
+
motion_repr_type: SkeletonRescalePose
|
| 43 |
+
pose_box_size: 1.5
|
| 44 |
+
seq_centering: 0
|
| 45 |
+
task_name: hmp
|
| 46 |
+
num_joints: 18
|
| 47 |
+
fps: 30
|
| 48 |
+
multimodal_threshold: 0.5
|
| 49 |
+
dataset_type: FreeManDataset
|
| 50 |
+
dataset_name: freeman
|
| 51 |
+
precomputed_folder: ./datasets/processed/FreeMan/hmp
|
| 52 |
+
annotations_folder: ./datasets/annotations/FreeMan/hmp
|
| 53 |
+
dtype: float32
|
| 54 |
+
data_loader_train:
|
| 55 |
+
stride: 10
|
| 56 |
+
augmentation: 5
|
| 57 |
+
shuffle: true
|
| 58 |
+
actions: all
|
| 59 |
+
da_mirroring: 0.5
|
| 60 |
+
da_rotations: 1.0
|
| 61 |
+
drop_last: true
|
| 62 |
+
if_load_mmgt: false
|
| 63 |
+
data_loader_train_eval:
|
| 64 |
+
stride: 30
|
| 65 |
+
augmentation: 0
|
| 66 |
+
shuffle: false
|
| 67 |
+
actions: all
|
| 68 |
+
da_mirroring: 0.0
|
| 69 |
+
da_rotations: 0.0
|
| 70 |
+
drop_last: false
|
| 71 |
+
if_load_mmgt: false
|
| 72 |
+
data_loader_valid:
|
| 73 |
+
stride: 30
|
| 74 |
+
augmentation: 0
|
| 75 |
+
shuffle: false
|
| 76 |
+
segments_path: ./datasets/annotations/FreeMan/hmp/segments_valid.csv
|
| 77 |
+
actions: all
|
| 78 |
+
drop_last: false
|
| 79 |
+
if_load_mmgt: false
|
| 80 |
+
|
| 81 |
+
autoenc_arch:
|
| 82 |
+
enc_num_layers: 1
|
| 83 |
+
encoder_hidden_size: 96
|
| 84 |
+
decoder_hidden_size: 96
|
| 85 |
+
arch: AutoEncoder
|
| 86 |
+
recurrent_arch_enc: StaticGraphGRU
|
| 87 |
+
recurrent_arch_decoder: StaticGraphGRU
|
trained_models/hmp/freeman/diffusion/checkpoints/cvpr_release.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50dcf7bb231d0712f03baba0d761608352b97933c11b6c8f1d4091cc5dfcfa47
|
| 3 |
+
size 466423511
|
trained_models/hmp/freeman/diffusion/config.yaml
ADDED
|
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
if_resume_training: false
|
| 2 |
+
device: cuda
|
| 3 |
+
load: false
|
| 4 |
+
load_path: ''
|
| 5 |
+
dataset_main_path: ./datasets
|
| 6 |
+
dataset_annotation_path: ./datasets/annotations
|
| 7 |
+
dataset_precomputed_path: ./datasets/processed
|
| 8 |
+
output_log_path: ./trained_models/hmp/freeman/diffusion
|
| 9 |
+
pretrained_autoencoder_path: ./trained_models/hmp/freeman/autoencoder/checkpoints/cvpr_release.pt
|
| 10 |
+
lr: 0.001
|
| 11 |
+
diffusion_objective: pred_x0
|
| 12 |
+
weight_decay: 0.0
|
| 13 |
+
if_use_ema: true
|
| 14 |
+
step_start_ema: 100
|
| 15 |
+
ema_power: 0.6666666666666666
|
| 16 |
+
ema_update_every: 10
|
| 17 |
+
ema_min_value: 0.0
|
| 18 |
+
use_lr_scheduler: true
|
| 19 |
+
lr_scheduler_kwargs:
|
| 20 |
+
lr_scheduler_type: ExponentialLRSchedulerWarmup
|
| 21 |
+
warmup_duration: 25
|
| 22 |
+
update_every: 5
|
| 23 |
+
min_lr: 0.0001
|
| 24 |
+
gamma_decay: 0.85
|
| 25 |
+
diffusion_conditioning: true
|
| 26 |
+
num_epochs: 200
|
| 27 |
+
num_workers: 4
|
| 28 |
+
batch_size: 64
|
| 29 |
+
batch_size_eval: 256
|
| 30 |
+
eval_frequency: 25
|
| 31 |
+
train_pick_best_sample_among_k: 50
|
| 32 |
+
similarity_space: input_space
|
| 33 |
+
diffusion_activation: identity
|
| 34 |
+
num_prob_samples: 50
|
| 35 |
+
diffusion_timesteps: 10
|
| 36 |
+
diffusion_type: NonisotropicGaussianDiffusion
|
| 37 |
+
diffusion_loss_type: snr
|
| 38 |
+
loss_reduction_type: l1
|
| 39 |
+
if_run_as_isotropic: false
|
| 40 |
+
if_sigma_n_scale: true
|
| 41 |
+
diffusion_covariance_type: skeleton-diffusion
|
| 42 |
+
gamma_scheduler: cosine
|
| 43 |
+
beta_schedule: cosine
|
| 44 |
+
sigma_n_scale: spectral
|
| 45 |
+
num_iter_perepoch: null
|
| 46 |
+
seed: 63485
|
| 47 |
+
diffusion_arch:
|
| 48 |
+
arch: Denoiser
|
| 49 |
+
use_attention: true
|
| 50 |
+
self_condition: false
|
| 51 |
+
norm_type: none
|
| 52 |
+
depth: 4
|
| 53 |
+
attn_dim_head: 32
|
| 54 |
+
attn_heads: 8
|
| 55 |
+
learn_influence: true
|
| 56 |
+
covariance_matrix_type: adjacency
|
trained_models/hmp/h36m/autoencoder/checkpoints/cvpr_release.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:071937a8da740fa99a374a64e09f4ac4ab946a3025da3b7b271bc3bb4a7b3781
|
| 3 |
+
size 16956747
|
trained_models/hmp/h36m/autoencoder/config.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
dataset_main_path: ./datasets
|
| 2 |
+
dataset_annotation_path: ./datasets/annotations
|
| 3 |
+
dataset_precomputed_path: ./datasets/processed
|
| 4 |
+
if_resume_training: false
|
| 5 |
+
device: cuda
|
| 6 |
+
load: false
|
| 7 |
+
load_path: ''
|
| 8 |
+
output_log_path: ./trained_models/hmp/h36m/autoencoder
|
| 9 |
+
batch_size: 64
|
| 10 |
+
batch_size_eval: 512
|
| 11 |
+
if_run_validation: false
|
| 12 |
+
eval_frequency: 25
|
| 13 |
+
num_epochs: 200
|
| 14 |
+
num_iteration_eval: 10
|
| 15 |
+
num_workers: 4
|
| 16 |
+
seed: 52345
|
| 17 |
+
use_lr_scheduler: true
|
| 18 |
+
lr_scheduler_kwargs:
|
| 19 |
+
lr_scheduler_type: ExponentialLRSchedulerWarmup
|
| 20 |
+
warmup_duration: 10
|
| 21 |
+
update_every: 1
|
| 22 |
+
min_lr: 0.0001
|
| 23 |
+
gamma_decay: 0.98
|
| 24 |
+
loss_pose_type: l1
|
| 25 |
+
lr: 0.005
|
| 26 |
+
latent_size: 96
|
| 27 |
+
output_size: 3
|
| 28 |
+
z_activation: tanh
|
| 29 |
+
num_iter_perepoch: 485
|
| 30 |
+
obs_length: 25
|
| 31 |
+
prediction_horizon_train: 100
|
| 32 |
+
prediction_horizon_eval: 100
|
| 33 |
+
prediction_horizon: 100
|
| 34 |
+
pred_length: 100
|
| 35 |
+
prediction_horizon_train_min: 10
|
| 36 |
+
prediction_horizon_train_min_from_epoch: 200
|
| 37 |
+
curriculum_it: 10
|
| 38 |
+
random_prediction_horizon: true
|
| 39 |
+
if_consider_hip: false
|
| 40 |
+
history_sec: 0.5
|
| 41 |
+
prediction_horizon_sec: 2
|
| 42 |
+
motion_repr_type: SkeletonRescalePose
|
| 43 |
+
pose_box_size: 1.5
|
| 44 |
+
seq_centering: 0
|
| 45 |
+
task_name: hmp
|
| 46 |
+
num_joints: 17
|
| 47 |
+
fps: 50
|
| 48 |
+
multimodal_threshold: 0.5
|
| 49 |
+
dataset_type: H36MDataset
|
| 50 |
+
dataset_name: h36m
|
| 51 |
+
precomputed_folder: ./datasets/processed/Human36M/hmp/
|
| 52 |
+
annotations_folder: ./datasets/annotations/Human36M/hmp
|
| 53 |
+
dtype: float32
|
| 54 |
+
data_loader_train:
|
| 55 |
+
stride: 10
|
| 56 |
+
augmentation: 5
|
| 57 |
+
shuffle: true
|
| 58 |
+
subjects:
|
| 59 |
+
- S1
|
| 60 |
+
- S5
|
| 61 |
+
- S6
|
| 62 |
+
- S7
|
| 63 |
+
- S8
|
| 64 |
+
actions: all
|
| 65 |
+
da_mirroring: 0.5
|
| 66 |
+
da_rotations: 1.0
|
| 67 |
+
drop_last: true
|
| 68 |
+
if_load_mmgt: false
|
| 69 |
+
data_loader_train_eval:
|
| 70 |
+
stride: 30
|
| 71 |
+
augmentation: 0
|
| 72 |
+
shuffle: false
|
| 73 |
+
subjects:
|
| 74 |
+
- S1
|
| 75 |
+
- S5
|
| 76 |
+
- S6
|
| 77 |
+
- S7
|
| 78 |
+
- S8
|
| 79 |
+
actions: all
|
| 80 |
+
da_mirroring: 0.0
|
| 81 |
+
da_rotations: 0.0
|
| 82 |
+
drop_last: false
|
| 83 |
+
if_load_mmgt: false
|
| 84 |
+
data_loader_valid:
|
| 85 |
+
stride: 30
|
| 86 |
+
augmentation: 0
|
| 87 |
+
shuffle: false
|
| 88 |
+
subjects:
|
| 89 |
+
- S8
|
| 90 |
+
segments_path: ./datasets/annotations/Human36M/hmp/segments_valid.csv
|
| 91 |
+
actions: all
|
| 92 |
+
drop_last: false
|
| 93 |
+
if_load_mmgt: false
|
| 94 |
+
|
| 95 |
+
|
| 96 |
+
autoenc_arch:
|
| 97 |
+
enc_num_layers: 1
|
| 98 |
+
encoder_hidden_size: 96
|
| 99 |
+
decoder_hidden_size: 96
|
| 100 |
+
arch: AutoEncoder
|
| 101 |
+
recurrent_arch_enc: StaticGraphGRU
|
| 102 |
+
recurrent_arch_decoder: StaticGraphGRU
|
trained_models/hmp/h36m/diffusion/checkpoints/cvpr_release.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48778f2d8d9dc03a9d25ca4d72a21c491a1d1a7e0ff7707cdacfd81f178cba3d
|
| 3 |
+
size 510561879
|
trained_models/hmp/h36m/diffusion/config.yaml
ADDED
|
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
if_resume_training: false
|
| 2 |
+
device: cuda
|
| 3 |
+
load: false
|
| 4 |
+
load_path: ''
|
| 5 |
+
dataset_main_path: ./datasets
|
| 6 |
+
dataset_annotation_path: ./datasets/annotations
|
| 7 |
+
dataset_precomputed_path: ./datasets/processed
|
| 8 |
+
output_log_path: ./trained_models/hmp/h36m/diffusion
|
| 9 |
+
pretrained_autoencoder_path: ./trained_models/hmp/h36m/autoencoder/checkpoints/cvpr_release.pt
|
| 10 |
+
lr: 0.001
|
| 11 |
+
diffusion_objective: pred_x0
|
| 12 |
+
weight_decay: 0.0
|
| 13 |
+
if_use_ema: true
|
| 14 |
+
step_start_ema: 100
|
| 15 |
+
ema_power: 0.6666666666666666
|
| 16 |
+
ema_update_every: 10
|
| 17 |
+
ema_min_value: 0.0
|
| 18 |
+
use_lr_scheduler: true
|
| 19 |
+
lr_scheduler_kwargs:
|
| 20 |
+
lr_scheduler_type: ExponentialLRSchedulerWarmup
|
| 21 |
+
warmup_duration: 25
|
| 22 |
+
update_every: 2
|
| 23 |
+
min_lr: 0.0001
|
| 24 |
+
gamma_decay: 0.85
|
| 25 |
+
diffusion_conditioning: true
|
| 26 |
+
num_epochs: 100
|
| 27 |
+
num_workers: 4
|
| 28 |
+
batch_size: 64
|
| 29 |
+
batch_size_eval: 256
|
| 30 |
+
eval_frequency: 25
|
| 31 |
+
train_pick_best_sample_among_k: 50
|
| 32 |
+
similarity_space: input_space
|
| 33 |
+
diffusion_activation: identity
|
| 34 |
+
num_prob_samples: 50
|
| 35 |
+
diffusion_timesteps: 10
|
| 36 |
+
diffusion_type: NonisotropicGaussianDiffusion
|
| 37 |
+
diffusion_loss_type: snr
|
| 38 |
+
loss_reduction_type: l1
|
| 39 |
+
if_run_as_isotropic: false
|
| 40 |
+
if_sigma_n_scale: true
|
| 41 |
+
diffusion_covariance_type: skeleton-diffusion
|
| 42 |
+
gamma_scheduler: cosine
|
| 43 |
+
beta_schedule: cosine
|
| 44 |
+
sigma_n_scale: spectral
|
| 45 |
+
num_iter_perepoch: null
|
| 46 |
+
seed: 63485
|
| 47 |
+
diffusion_arch:
|
| 48 |
+
arch: Denoiser
|
| 49 |
+
use_attention: true
|
| 50 |
+
self_condition: false
|
| 51 |
+
norm_type: none
|
| 52 |
+
depth: 4
|
| 53 |
+
attn_dim_head: 32
|
| 54 |
+
attn_heads: 8
|
| 55 |
+
learn_influence: true
|
| 56 |
+
covariance_matrix_type: adjacency
|