class CONFIG:
    """Project-wide configuration, grouped into nested namespace classes.

    Values are plain class attributes and are read as, for example,
    ``CONFIG.TRAIN.batch_size`` or ``CONFIG.DATA.EVAL.masking``. Nothing here
    is meant to be instantiated.
    """

    # Comma-separated device indices, kept as a string.
    gpus = "0,1"

    class TRAIN:
        """Optimisation hyper-parameters."""

        batch_size = 90
        lr = 1e-4
        epochs = 150
        workers = 12
        val_split = 0.1
        clipping_val = 1.0
        # NOTE(review): `patience` / `factor` look like learning-rate
        # scheduler settings -- confirm against the training code.
        patience = 3
        factor = 0.5

    class MODEL:
        """Network size settings (the `enc_*` and `pred_*` groups)."""

        enc_layers = 4
        enc_in_dim = 384
        enc_dim = 768
        pred_dim = 512
        pred_layers = 1

    class DATA:
        """Dataset selection, file locations and audio framing settings."""

        # Key into `data_dir` selecting the active dataset.
        dataset = 'vctk'

        # Dictionary that specifies the path to the root directory and the
        # train/test text files of each dataset.
        # 'root' is the path to the dataset, and each line of the
        # train.txt/test.txt files should contain the path to an audio file
        # relative to 'root'.
        data_dir = {
            'vctk': {
                'root': 'data/vctk/wav48',
                'train': "data/vctk/train.txt",
                'test': "data/vctk/test.txt",
            },
        }

        # Fail at import time if `dataset` has no entry in `data_dir`.
        assert dataset in data_dir, 'Unknown dataset.'

        # NOTE(review): presumably the sample rate in Hz, with the three
        # sizes below expressed in samples -- confirm against the data loader.
        sr = 48000
        audio_chunk_len = 122880
        window_size = 960
        stride = 480

        class TRAIN:
            """Packet-loss settings applied to training data."""

            packet_sizes = [256, 512, 768, 960, 1024, 1536]
            transition_probs = ((0.9, 0.1), (0.5, 0.1), (0.5, 0.5))

        class EVAL:
            """Packet-loss settings applied to evaluation data."""

            packet_size = 960
            transition_probs = [(0.9, 0.1)]

            # Mask source; only 'gen' and 'real' are accepted.
            masking = 'gen'
            assert masking in ('gen', 'real')

            # Directory spelling matches TEST.in_dir ('lossy_signals'); the
            # previous value was misspelled 'lossy_singals'.
            # NOTE(review): presumably only read when masking == 'real'.
            trace_path = 'test_samples/blind/lossy_signals'

    class LOG:
        """Output locations for logs and audio samples."""

        log_dir = 'lightning_logs'
        sample_path = 'audio_samples'

    class TEST:
        """Input and output directories for the test run."""

        in_dir = 'test_samples/blind/lossy_signals'
        out_dir = 'test_samples/blind/lossy_signals_out'
|