Naozumi0512 committed on
Commit
cc890f7
·
verified ·
1 Parent(s): 85ad847

Upload 4 files

Browse files
Files changed (4) hide show
  1. MONOPHONIC_CHARS.txt +0 -0
  2. POLYPHONIC_CHARS.txt +0 -0
  3. config.py +36 -0
  4. g2pw.onnx +3 -0
MONOPHONIC_CHARS.txt ADDED
The diff for this file is too large to render. See raw diff
 
POLYPHONIC_CHARS.txt ADDED
The diff for this file is too large to render. See raw diff
 
config.py ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ root = './rimeExtract_dataset/'
2
+
3
+ manual_seed = 1313
4
+ model_source = './bert-large-cantonese'
5
+ polyphonic_chars_path = root + 'POLYPHONIC_CHARS.txt'
6
+ window_size = 32
7
+ num_workers = 2
8
+ use_mask = True
9
+ use_conditional = True
10
+ param_conditional = {
11
+ 'bias': True,
12
+ 'char-linear': True,
13
+ 'pos-linear': False,
14
+ 'char+pos-second': True,
15
+ }
16
+
17
+ # for training
18
+ exp_name = 'rimeData_BERT_L_DescWS-Sec-cLin-B_POSw01'
19
+ train_sent_path = root + 'train.sent'
20
+ train_lb_path = root + 'train.lb'
21
+ valid_sent_path = root + 'dev.sent'
22
+ valid_lb_path = root + 'dev.lb'
23
+ test_sent_path = root + 'test.sent'
24
+ test_lb_path = root + 'test.lb'
25
+ batch_size = 128
26
+ lr = 5e-5
27
+ val_interval = 200
28
+ num_iter = 10000
29
+ use_pos = True
30
+ param_pos = {
31
+ 'weight': 0.1,
32
+ 'pos_joint_training': True,
33
+ 'train_pos_path': root + 'train.pos',
34
+ 'valid_pos_path': root + 'dev.pos',
35
+ 'test_pos_path': root + 'test.pos'
36
+ }
g2pw.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02ad3c516e3edc373065279d3700b31699694828dc282afa18dcee429bff05d7
3
+ size 1840096049