1-800-BAD-CODE committed on
Commit
c640205
1 Parent(s): ce426d6

Create config.yaml

Browse files
Files changed (1) hide show
  1. config.yaml +21 -0
config.yaml ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # English model
2
+ languages: [
3
+ "en"
4
+ ]
5
+
6
+ # The model has 512 positional embeddings, but was only trained on sequences of up to 256 tokens
7
+ max_length: 256
8
+
9
+ # Not actually used, but included for pipeline generality
10
+ pre_labels: [
11
+ "<NULL>",
12
+ "¿",
13
+ ]
14
+
15
+ post_labels: [
16
+ "<NULL>",
17
+ "<ACRONYM>",
18
+ ".",
19
+ ",",
20
+ "?",
21
+ ]