File size: 306 Bytes
c9d0124
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
{
  "tokenizer_class": "BertJapaneseTokenizer",
  "do_lower_case": false,
  "do_word_tokenize": true,
  "do_subword_tokenize": true,
  "word_tokenizer_type": "sudachi",
  "subword_tokenizer_type": "wordpiece",
  "model_max_length": 512,
  "sudachi_kwargs": {
    "sudachi_split_mode": "A",
    "sudachi_dict_type": "core"
  }
}