chengdongliang committed on
Commit
de9250c
1 Parent(s): cbe68d6

upload model.pt

Browse files
Files changed (2) hide show
  1. avg_model.pt +3 -0
  2. config.yaml +88 -0
avg_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:527cbf6b82c338bac1fda70004bdd26a08bdc04972977a1f9fbd4870f7a85411
3
+ size 45084229
config.yaml ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ checkpoint: exp/Gemini_DF_ResNet114-TSTP-emb256-fbank80-num_frms200-aug0.6-spTrue-saFalse-ArcMargin-AdamW-epoch165-LM/models/model_0.pt
2
+ data_type: shard
3
+ dataloader_args:
4
+ batch_size: 32
5
+ drop_last: true
6
+ num_workers: 8
7
+ pin_memory: false
8
+ prefetch_factor: 8
9
+ dataset_args:
10
+ aug_prob: 0.6
11
+ fbank_args:
12
+ dither: 1.0
13
+ frame_length: 25
14
+ frame_shift: 10
15
+ num_mel_bins: 80
16
+ filter: true
17
+ filter_args:
18
+ max_num_frames: 800
19
+ min_num_frames: 100
20
+ num_frms: 600
21
+ resample_rate: 16000
22
+ sample_num_per_epoch: 0
23
+ shuffle: true
24
+ shuffle_args:
25
+ shuffle_size: 2500
26
+ spec_aug: false
27
+ spec_aug_args:
28
+ max_f: 8
29
+ max_t: 10
30
+ num_f_mask: 1
31
+ num_t_mask: 1
32
+ prob: 0.6
33
+ speed_perturb: false
34
+ do_lm: true
35
+ enable_amp: false
36
+ exp_dir: exp/Gemini_DF_ResNet114-TSTP-emb256-fbank80-num_frms200-aug0.6-spTrue-saFalse-ArcMargin-AdamW-epoch165-LM
37
+ gpus:
38
+ - 0
39
+ - 1
40
+ log_batch_interval: 100
41
+ loss: CrossEntropyLoss
42
+ loss_args: {}
43
+ margin_scheduler: MarginScheduler
44
+ margin_update:
45
+ epoch_iter: 17062
46
+ final_margin: 0.5
47
+ fix_start_epoch: 1
48
+ increase_start_epoch: 1
49
+ increase_type: exp
50
+ initial_margin: 0.5
51
+ update_margin: true
52
+ model: Gemini_DF_ResNet114
53
+ model_args:
54
+ embed_dim: 256
55
+ feat_dim: 80
56
+ pooling_func: TSTP
57
+ two_emb_layer: false
58
+ model_init: null
59
+ noise_data: /data/VoxForWe/musan/lmdb
60
+ num_avg: 1
61
+ num_epochs: 5
62
+ optimizer: SGD
63
+ optimizer_args:
64
+ lr: 0.0001
65
+ momentum: 0.9
66
+ nesterov: true
67
+ weight_decay: 0.0001
68
+ projection_args:
69
+ do_lm: true
70
+ easy_margin: false
71
+ embed_dim: 256
72
+ num_class: 17982
73
+ project_type: arc_margin
74
+ scale: 32.0
75
+ reverb_data: /data/VoxForWe/rirs/lmdb
76
+ save_epoch_interval: 1
77
+ scheduler: ExponentialDecrease
78
+ scheduler_args:
79
+ epoch_iter: 17062
80
+ final_lr: 2.5e-05
81
+ initial_lr: 0.0001
82
+ num_epochs: 5
83
+ scale_ratio: 1.0
84
+ warm_from_zero: true
85
+ warm_up_epoch: 1
86
+ seed: 42
87
+ train_data: /data/VoxForWe/vox2_dev/shard.list
88
+ train_label: /data/VoxForWe/vox2_dev/utt2spk