| DATASET: | |
| TRAIN_FILE_LIST: /apdcephfs_cq2/share_1290939/wenxuazhang/code/file_list/train.txt | |
| EVAL_FILE_LIST: /apdcephfs_cq2/share_1290939/wenxuazhang/code/file_list/val.txt | |
| TRAIN_BATCH_SIZE: 32 | |
| EVAL_BATCH_SIZE: 32 | |
| EXP: True | |
| EXP_DIM: 64 | |
| FRAME_LEN: 32 | |
| COEFF_LEN: 73 | |
| NUM_CLASSES: 46 | |
| AUDIO_ROOT_PATH: /apdcephfs_cq2/share_1290939/wenxuazhang/voxceleb1/wav | |
| COEFF_ROOT_PATH: /apdcephfs_cq2/share_1290939/wenxuazhang/voxceleb1/wav2lip_3dmm | |
| LMDB_PATH: /apdcephfs_cq2/share_1290939/shadowcun/datasets/VoxCeleb/v1/imdb | |
| DEBUG: True | |
| NUM_REPEATS: 2 | |
| T: 40 | |
| MODEL: | |
| FRAMEWORK: V2 | |
| AUDIOENCODER: | |
| LEAKY_RELU: True | |
| NORM: 'IN' | |
| DISCRIMINATOR: | |
| LEAKY_RELU: False | |
| INPUT_CHANNELS: 6 | |
| CVAE: | |
| AUDIO_EMB_IN_SIZE: 512 | |
| AUDIO_EMB_OUT_SIZE: 128 | |
| SEQ_LEN: 32 | |
| LATENT_SIZE: 256 | |
| ENCODER_LAYER_SIZES: [192, 1024] | |
| DECODER_LAYER_SIZES: [1024, 192] | |
| TRAIN: | |
| MAX_EPOCH: 300 | |
| GENERATOR: | |
| LR: 2.0e-5 | |
| DISCRIMINATOR: | |
| LR: 1.0e-5 | |
| LOSS: | |
| W_FEAT: 0 | |
| W_COEFF_EXP: 2 | |
| W_LM: 1.0e-2 | |
| W_LM_MOUTH: 0 | |
| W_REG: 0 | |
| W_SYNC: 0 | |
| W_COLOR: 0 | |
| W_EXPRESSION: 0 | |
| W_LIPREADING: 0.01 | |
| W_LIPREADING_VV: 0 | |
| W_EYE_BLINK: 4 | |
| TAG: | |
| NAME: small_dataset | |