File size: 1,310 Bytes
f57d52a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 |
# Run configuration for model_type SSLMOS (outdir: exp/ssl-mos-wav2vec2-3337).
# Keys are sorted alphabetically within each mapping.
# Child keys must stay indented under their parent: at column 0 the parent
# becomes null and the two `order` keys collide as top-level duplicates.
additional_config: null
allow_cache: true
# Metric key and ordering for best-model selection
# (presumably used together with keep_nbest_models; confirm against the trainer).
best_model_criterion:
  key: sys_SRCC
  order: highest
collater_type: NonIntrusiveCollater
config: conf/ssl-mos-wav2vec2.yaml
dataset_type: NonIntrusiveDataset
dev_csv_path: data/bvcc_dev.csv
distributed: false
eval_and_save_interval_steps: 100
grad_norm: 1.0
inference_mode: mean_net
init_checkpoint: ''
keep_nbest_models: 5
listener_score_criterions: null
log_interval_steps: 100
# List of loss definitions; a single ScalarLoss entry here.
mean_score_criterions:
- criterion_params:
    masked_loss: false
    order: 1  # distinct from best_model_criterion.order
    tau: 0.5
  criterion_type: ScalarLoss
  criterion_weight: 1.0
model_input: waveform
# Parameters for the model named by model_type.
model_params:
  mean_net_dnn_dim: 64
  mean_net_output_type: scalar
  mean_net_range_clipping: true
  s3prl_name: wav2vec2
  ssl_model_layer_idx: -1
  ssl_model_output_dim: 768
  ssl_module: s3prl
  use_listener_modeling: false
  use_mean_listener: false
model_type: SSLMOS
num_workers: 0
# Parameters for the optimizer named by optimizer_type.
optimizer_params:
  lr: 0.001
  momentum: 0.9
optimizer_type: SGD
outdir: exp/ssl-mos-wav2vec2-3337  # suffix matches `seed` below
padding_mode: repetitive
patience: 20
pin_memory: true
rank: 0
resume: ''
sampling_rate: 16000
scheduler_type: null
seed: 3337
test_batch_size: 1
train_batch_size: 16
train_csv_path: data/bvcc_train.csv
train_max_steps: 100000
trainer_type: NonIntrusiveEstimatorTrainer
use_phoneme: false
verbose: 1
version: 0.1.0
wav_only: true
|