File size: 306 Bytes
c9d0124 |
1 2 3 4 5 6 7 8 9 10 11 12 |
{
"tokenizer_class": "BertJapaneseTokenizer",
"do_lower_case": false,
"do_word_tokenize": true,
"do_subword_tokenize": true,
"word_tokenizer_type": "sudachi",
"subword_tokenizer_type": "wordpiece",
"model_max_length": 512,
"sudachi_kwargs": {"sudachi_split_mode":"A","sudachi_dict_type":"core"}
}
|