Naozumi0512 committed on
Commit
bea4509
·
verified ·
1 Parent(s): fe708ee

Upload 4 files

Browse files
Files changed (4) hide show
  1. MONOPHONIC_CHARS.txt +0 -0
  2. POLYPHONIC_CHARS.txt +0 -0
  3. config.py +37 -0
  4. g2pw.onnx +3 -0
MONOPHONIC_CHARS.txt ADDED
The diff for this file is too large to render. See raw diff
 
POLYPHONIC_CHARS.txt ADDED
The diff for this file is too large to render. See raw diff
 
config.py ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # root = './20241128-rimePure-zjyg/'
2
+ root = './rimeExtract_dataset/'
3
+
4
+ manual_seed = 1313
5
+ model_source = './bert-base-cantonese'
6
+ polyphonic_chars_path = root + 'POLYPHONIC_CHARS.txt'
7
+ window_size = 32
8
+ num_workers = 2
9
+ use_mask = True
10
+ use_conditional = True
11
+ param_conditional = {
12
+ 'bias': True,
13
+ 'char-linear': True,
14
+ 'pos-linear': False,
15
+ 'char+pos-second': True,
16
+ }
17
+
18
+ # for training
19
+ exp_name = '20241201_BERT_B_DescWS-Sec-cLin-B_POSw01'
20
+ train_sent_path = root + 'train.sent'
21
+ train_lb_path = root + 'train.lb'
22
+ valid_sent_path = root + 'dev.sent'
23
+ valid_lb_path = root + 'dev.lb'
24
+ test_sent_path = root + 'test.sent'
25
+ test_lb_path = root + 'test.lb'
26
+ batch_size = 128
27
+ lr = 5e-5
28
+ val_interval = 200
29
+ num_iter = 13000
30
+ use_pos = True
31
+ param_pos = {
32
+ 'weight': 0.1,
33
+ 'pos_joint_training': True,
34
+ 'train_pos_path': root + 'train.pos',
35
+ 'valid_pos_path': root + 'dev.pos',
36
+ 'test_pos_path': root + 'test.pos'
37
+ }
g2pw.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c751a9b76c3b0f90fb9077aa1fc97215cab44d05d6cd35244a54a2a1ad35009
3
+ size 941756575