# File-viewer metadata (not part of the config): size 302 Bytes, ref c640205
# English model
languages:
  - "en"

# Model has 512 positional embeddings, but was only trained on sequences of
# up to 256 tokens
max_length: 256

# Not actually used, but included for pipeline generality
pre_labels:
  - "<NULL>"
  - "¿"

# NOTE(review): presumably the counterpart of pre_labels for marks that follow
# a token - confirm against the consuming pipeline. The entries are kept
# quoted on purpose: ",", "?" and "<...>" are not safe as plain YAML scalars
# in every context.
post_labels:
  - "<NULL>"
  - "<ACRONYM>"
  - "."
  - ","
  - "?"