File size: 302 Bytes
c640205
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
# Languages covered by this model: English only.
languages:
  - "en"

# Maximum sequence length, in tokens.
# The model has 512 positional embeddings, but it was only trained on
# sequences of up to 256 tokens, so the limit is set to the trained length
# rather than the embedding capacity.
max_length: 256

# This list is not actually used; it is included only for pipeline
# generality. Entries: the "<NULL>" label and the inverted question mark.
pre_labels:
  - "<NULL>"
  - "¿"

# Entries, in order: "<NULL>", "<ACRONYM>", period, comma, question mark.
# NOTE(review): the order presumably maps to the model's class indices --
# confirm against the consuming pipeline before reordering or inserting.
post_labels:
  - "<NULL>"
  - "<ACRONYM>"
  - "."
  - ","
  - "?"