Spaces: Running on A10G
DATASET: | |
TRAIN_FILE_LIST: /apdcephfs_cq2/share_1290939/wenxuazhang/code/file_list/train.txt | |
EVAL_FILE_LIST: /apdcephfs_cq2/share_1290939/wenxuazhang/code/file_list/val.txt | |
TRAIN_BATCH_SIZE: 32 | |
EVAL_BATCH_SIZE: 32 | |
EXP: True | |
EXP_DIM: 64 | |
FRAME_LEN: 32 | |
COEFF_LEN: 73 | |
NUM_CLASSES: 46 | |
AUDIO_ROOT_PATH: /apdcephfs_cq2/share_1290939/wenxuazhang/voxceleb1/wav | |
COEFF_ROOT_PATH: /apdcephfs_cq2/share_1290939/wenxuazhang/voxceleb1/wav2lip_3dmm | |
LMDB_PATH: /apdcephfs_cq2/share_1290939/shadowcun/datasets/VoxCeleb/v1/imdb | |
DEBUG: True | |
NUM_REPEATS: 2 | |
T: 40 | |
MODEL: | |
FRAMEWORK: V2 | |
AUDIOENCODER: | |
LEAKY_RELU: True | |
NORM: 'IN' | |
DISCRIMINATOR: | |
LEAKY_RELU: False | |
INPUT_CHANNELS: 6 | |
CVAE: | |
AUDIO_EMB_IN_SIZE: 512 | |
AUDIO_EMB_OUT_SIZE: 128 | |
SEQ_LEN: 32 | |
LATENT_SIZE: 256 | |
ENCODER_LAYER_SIZES: [192, 1024] | |
DECODER_LAYER_SIZES: [1024, 192] | |
TRAIN: | |
MAX_EPOCH: 300 | |
GENERATOR: | |
LR: 2.0e-5 | |
DISCRIMINATOR: | |
LR: 1.0e-5 | |
LOSS: | |
W_FEAT: 0 | |
W_COEFF_EXP: 2 | |
W_LM: 1.0e-2 | |
W_LM_MOUTH: 0 | |
W_REG: 0 | |
W_SYNC: 0 | |
W_COLOR: 0 | |
W_EXPRESSION: 0 | |
W_LIPREADING: 0.01 | |
W_LIPREADING_VV: 0 | |
W_EYE_BLINK: 4 | |
TAG: | |
NAME: small_dataset | |