File size: 702 Bytes
6d737a4
 
 
 
 
 
 
 
 
 
3d5de11
031e5e2
90a23dc
7cf274a
 
 
 
 
a4a574a
 
 
 
 
 
 
 
 
 
06e9e3b
 
 
 
 
 
 
 
 
 
031e5e2
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
# Settings stored under the section name "preprocessing".
# Apart from MODEL, every value here matches the [tapp], [adapmit] and
# [sector] sections of this file.
[preprocessing]
# NOTE(review): presumably a score cutoff in the 0-1 range - confirm against the reader.
THRESHOLD = 0.50
# NOTE(review): "garbage" does not follow the GIZ/<NAME>-multilabel-bge_f
# pattern used by the other sections; looks like a placeholder - confirm
# whether this key is read at all for this section.
MODEL = garbage
# NOTE(review): the three SPLIT_* keys presumably describe chunking: units of
# SPLIT_BY, SPLIT_LENGTH units per chunk, SPLIT_OVERLAP units shared between
# neighbouring chunks - confirm against the code that reads them.
SPLIT_BY = word
# 0/1 flag; presumably toggles punctuation removal - confirm.
REMOVE_PUNC = 0
SPLIT_LENGTH = 60
SPLIT_OVERLAP = 10
# 0/1 flag; presumably keeps chunks from cutting through a sentence - confirm.
RESPECT_SENTENCE_BOUNDARY = 1
# NOTE(review): meaning not visible in this file (possibly a top-N limit) - confirm.
TOP_KEY = 10

# Settings stored under the section name "tapp".
# Apart from MODEL, every value here matches the other sections of this file.
[tapp]
# NOTE(review): presumably a score cutoff in the 0-1 range - confirm against the reader.
THRESHOLD = 0.50
# NOTE(review): looks like an <organisation>/<model-name> identifier - confirm
# where it is resolved.
MODEL = GIZ/TAPP-multilabel-bge_f
# NOTE(review): the three SPLIT_* keys presumably describe chunking: units of
# SPLIT_BY, SPLIT_LENGTH units per chunk, SPLIT_OVERLAP units shared between
# neighbouring chunks - confirm against the code that reads them.
SPLIT_BY = word
# 0/1 flag; presumably toggles punctuation removal - confirm.
REMOVE_PUNC = 0
SPLIT_LENGTH = 60
SPLIT_OVERLAP = 10
# 0/1 flag; presumably keeps chunks from cutting through a sentence - confirm.
RESPECT_SENTENCE_BOUNDARY = 1
# NOTE(review): meaning not visible in this file (possibly a top-N limit) - confirm.
TOP_KEY = 10

# Settings stored under the section name "adapmit".
# Marked "updated" by the original author; that note used to trail the
# section header and now sits on its own line, because text after "]" is
# not treated as a comment by every INI parser.
[adapmit]
# NOTE(review): presumably a score cutoff in the 0-1 range - confirm against the reader.
THRESHOLD = 0.50
# NOTE(review): looks like an <organisation>/<model-name> identifier - confirm
# where it is resolved.
MODEL = GIZ/ADAPMIT-multilabel-bge_f
# NOTE(review): the three SPLIT_* keys presumably describe chunking: units of
# SPLIT_BY, SPLIT_LENGTH units per chunk, SPLIT_OVERLAP units shared between
# neighbouring chunks - confirm against the code that reads them.
SPLIT_BY = word
# 0/1 flag; presumably toggles punctuation removal - confirm.
REMOVE_PUNC = 0
SPLIT_LENGTH = 60
SPLIT_OVERLAP = 10
# 0/1 flag; presumably keeps chunks from cutting through a sentence - confirm.
RESPECT_SENTENCE_BOUNDARY = 1
# NOTE(review): meaning not visible in this file (possibly a top-N limit) - confirm.
TOP_KEY = 10

# Settings stored under the section name "sector".
# Marked "updated" by the original author; that note used to trail the
# section header and now sits on its own line, because text after "]" is
# not treated as a comment by every INI parser.
[sector]
# NOTE(review): presumably a score cutoff in the 0-1 range - confirm against the reader.
THRESHOLD = 0.50
# NOTE(review): looks like an <organisation>/<model-name> identifier - confirm
# where it is resolved.
MODEL = GIZ/SECTOR-multilabel-bge_f
# NOTE(review): the three SPLIT_* keys presumably describe chunking: units of
# SPLIT_BY, SPLIT_LENGTH units per chunk, SPLIT_OVERLAP units shared between
# neighbouring chunks - confirm against the code that reads them.
SPLIT_BY = word
# 0/1 flag; presumably toggles punctuation removal - confirm.
REMOVE_PUNC = 0
SPLIT_LENGTH = 60
SPLIT_OVERLAP = 10
# 0/1 flag; presumably keeps chunks from cutting through a sentence - confirm.
RESPECT_SENTENCE_BOUNDARY = 1
# NOTE(review): meaning not visible in this file (possibly a top-N limit) - confirm.
TOP_KEY = 10