root = './rimeExtract_dataset/' manual_seed = 1313 model_source = './bert-base-cantonese' polyphonic_chars_path = root + 'POLYPHONIC_CHARS.txt' window_size = 32 num_workers = 2 use_mask = True use_conditional = True param_conditional = { 'bias': True, 'char-linear': True, 'pos-linear': False, 'char+pos-second': True, } # for training exp_name = '20241206_BERT_B_DescWS-Sec-cLin-B_POS_hkcancor_w03' train_sent_path = root + 'train.sent' train_lb_path = root + 'train.lb' valid_sent_path = root + 'dev.sent' valid_lb_path = root + 'dev.lb' test_sent_path = root + 'test.sent' test_lb_path = root + 'test.lb' batch_size = 128 lr = 5e-5 val_interval = 200 num_iter = 13000 use_pos = True param_pos = { 'weight': 0.3, 'pos_joint_training': True, # 'train_pos_path': root + 'train.pos', # 'valid_pos_path': root + 'dev.pos', # 'test_pos_path': root + 'test.pos', 'train_pos_path': root + 'train_hkcancor.pos', 'valid_pos_path': root + 'dev_hkcancor.pos', 'test_pos_path': root + 'test_hkcancor.pos', }