{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 0, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 1, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 2, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 3, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "special": true }, { "id": 4, "content": "[UNK]", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 5, "content": "", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false, "special": true } ], "normalizer": { "type": "BertNormalizer", "clean_text": true, "handle_chinese_chars": true, "strip_accents": null, "lowercase": true }, "pre_tokenizer": { "type": "BertPreTokenizer" }, "post_processor": { "type": "RobertaProcessing", "sep": [ "", 2 ], "cls": [ "", 0 ], "trim_offsets": true, "add_prefix_space": false }, "decoder": { "type": "WordPiece", "prefix": "##", "cleanup": true }, "model": { "type": "WordPiece", "unk_token": "[UNK]", "continuing_subword_prefix": "##", "max_input_chars_per_word": 100, "vocab": { "": 0, "": 1, "": 2, "": 3, "[UNK]": 4, "": 5, "!": 6, "\"": 7, "#": 8, "$": 9, "%": 10, "&": 11, "'": 12, "(": 13, ")": 14, "*": 15, "+": 16, ",": 17, "-": 18, ".": 19, "/": 20, "0": 21, "1": 22, "2": 23, "3": 24, "4": 25, "5": 26, "6": 27, "7": 28, "8": 29, "9": 30, ":": 31, ";": 32, "<": 33, "=": 34, ">": 35, "?": 36, "@": 37, "[": 38, "\\": 39, "]": 40, "^": 41, "_": 42, "`": 43, "a": 44, "b": 45, "c": 46, "d": 47, "e": 48, "f": 49, "g": 50, "h": 51, "i": 52, "j": 53, "k": 54, "l": 55, "m": 56, "n": 57, "o": 58, "p": 59, "q": 60, "r": 61, "s": 62, "t": 63, "u": 64, "v": 65, "w": 66, "x": 67, "y": 68, "z": 69, "|": 70, "}": 71, "~": 72, "¡": 73, "¢": 74, "£": 75, "¥": 76, "§": 77, "°": 78, "±": 79, "²": 80, "³": 81, "´": 82, "µ": 83, "·": 84, "º": 85, "½": 86, "¿": 87, "×": 88, "ß": 89, "æ": 90, "ð": 91, "ø": 92, "þ": 93, "đ": 94, "ħ": 95, "ı": 96, "ł": 97, "œ": 98, "ɐ": 99, "ɑ": 100, "ɒ": 101, "ɔ": 102, "ə": 103, "ɛ": 104, "ɜ": 105, "ɡ": 106, "ɢ": 107, "ɪ": 108, "ɫ": 109, "ɳ": 110, "ɽ": 111, "ɾ": 112, "ʁ": 113, "ʃ": 114, "ʊ": 115, "ʋ": 116, "ʒ": 117, "ʔ": 118, "ʕ": 119, "ʲ": 120, "ʻ": 121, "ʼ": 122, "ʾ": 123, "ʿ": 124, "ˈ": 125, "ˌ": 126, "ː": 127, "α": 128, "β": 129, "γ": 130, "δ": 131, "ε": 132, "η": 133, "θ": 134, "ι": 135, "κ": 136, "λ": 137, "μ": 138, "ν": 139, "ξ": 140, "ο": 141, "π": 142, "ρ": 143, "ς": 144, "σ": 145, "τ": 146, "υ": 147, "φ": 148, "χ": 149, "ψ": 150, "ω": 151, "а": 152, "б": 153, "в": 154, "г": 155, "д": 156, "е": 157, "ж": 158, "з": 159, "и": 160, "к": 161, "л": 162, "м": 163, "н": 164, "о": 165, "п": 166, "р": 167, "с": 168, "т": 169, "у": 170, "х": 171, "ц": 172, "ш": 173, "ъ": 174, "ы": 175, "ь": 176, "ю": 177, "я": 178, "є": 179, "א": 180, "ב": 181, "ג": 182, "ה": 183, "ו": 184, "ז": 185, "ח": 186, "י": 187, "ל": 188, "ם": 189, "מ": 190, "ן": 191, "נ": 192, "ס": 193, "ף": 194, "פ": 195, "צ": 196, "ר": 197, "ש": 198, "ת": 199, "ء": 200, "ا": 201, "ب": 202, "ة": 203, "ت": 204, "ث": 205, "ج": 206, "ح": 207, "خ": 208, "د": 209, "ذ": 210, "ر": 211, "س": 212, "ش": 213, "ص": 214, "ع": 215, "ف": 216, "ق": 217, "ك": 218, "ل": 219, "م": 220, "ن": 221, "ه": 222, "و": 223, "ي": 224, "ܐ": 225, "ܕ": 226, "ܗ": 227, "ܝ": 228, "ܠ": 229, "ܢ": 230, "ܬ": 231, "अ": 232, "ई": 233, "क": 234, "ग": 235, "ण": 236, "त": 237, "द": 238, "न": 239, "प": 240, "ब": 241, "म": 242, "य": 243, "र": 244, "ल": 245, "व": 246, "स": 247, "ह": 248, "ा": 249, "ि": 250, "আ": 251, "ল": 252, "হ": 253, "া": 254, "ਅ": 255, "ਲ": 256, "ਹ": 257, "ਾ": 258, "അ": 259, "ള": 260, "ഹ": 261, "ാ": 262, "ก": 263, "ค": 264, "ง": 265, "ช": 266, "ซ": 267, "ญ": 268, "ฐ": 269, "ณ": 270, "ด": 271, "ต": 272, "น": 273, "บ": 274, "ป": 275, "พ": 276, "ภ": 277, "ม": 278, "ย": 279, "ร": 280, "ล": 281, "ว": 282, "ศ": 283, "ษ": 284, "ส": 285, "ห": 286, "อ": 287, "ฮ": 288, "ะ": 289, "า": 290, "เ": 291, "แ": 292, "ไ": 293, "ა": 294, "ბ": 295, "გ": 296, "დ": 297, "ე": 298, "ვ": 299, "ზ": 300, "თ": 301, "ი": 302, "კ": 303, "ლ": 304, "მ": 305, "ნ": 306, "ო": 307, "პ": 308, "ჟ": 309, "რ": 310, "ს": 311, "ტ": 312, "უ": 313, "ფ": 314, "ქ": 315, "ღ": 316, "ყ": 317, "შ": 318, "ჩ": 319, "ც": 320, "ძ": 321, "წ": 322, "ჭ": 323, "ხ": 324, "ჯ": 325, "ჰ": 326, "ჱ": 327, "ჲ": 328, "ჳ": 329, "ჴ": 330, "ჵ": 331, "ჶ": 332, "ჷ": 333, "ჸ": 334, "ჹ": 335, "ჺ": 336, "჻": 337, "ᄃ": 338, "ᄅ": 339, "ᄇ": 340, "ᄋ": 341, "ᄌ": 342, "ᅡ": 343, "ᅢ": 344, "ᅦ": 345, "ᅧ": 346, "ᅩ": 347, "ᅮ": 348, "ᅵ": 349, "ᆨ": 350, "ᆫ": 351, "ᆯ": 352, "ᆸ": 353, "ᆼ": 354, "ᵻ": 355, "‐": 356, "‑": 357, "–": 358, "—": 359, "―": 360, "‘": 361, "’": 362, "“": 363, "”": 364, "„": 365, "†": 366, "‡": 367, "•": 368, "…": 369, "′": 370, "″": 371, "⁄": 372, "₣": 373, "₤": 374, "€": 375, "₹": 376, "⅓": 377, "⅔": 378, "→": 379, "−": 380, "≡": 381, "≤": 382, "①": 383, "☉": 384, "☫": 385, "♀": 386, "♭": 387, "♯": 388, "⚳": 389, "ⴀ": 390, "ⴂ": 391, "ⴃ": 392, "ⴈ": 393, "ⴌ": 394, "ⴕ": 395, "ⴟ": 396, "〈": 397, "〉": 398, "〜": 399, "あ": 400, "い": 401, "う": 402, "お": 403, "か": 404, "き": 405, "く": 406, "け": 407, "こ": 408, "さ": 409, "し": 410, "す": 411, "せ": 412, "た": 413, "ち": 414, "っ": 415, "つ": 416, "と": 417, "な": 418, "に": 419, "の": 420, "は": 421, "ひ": 422, "ふ": 423, "ほ": 424, "ま": 425, "み": 426, "め": 427, "も": 428, "ゃ": 429, "ゆ": 430, "ょ": 431, "ら": 432, "り": 433, "る": 434, "れ": 435, "わ": 436, "を": 437, "ん": 438, "ァ": 439, "ア": 440, "ィ": 441, "イ": 442, "ゥ": 443, "ウ": 444, "ェ": 445, "エ": 446, "ォ": 447, "オ": 448, "カ": 449, "キ": 450, "ク": 451, "ケ": 452, "コ": 453, "サ": 454, "シ": 455, "ス": 456, "セ": 457, "タ": 458, "チ": 459, "ッ": 460, "ツ": 461, "テ": 462, "ト": 463, "ナ": 464, "ニ": 465, "ネ": 466, "ノ": 467, "ハ": 468, "フ": 469, "ヘ": 470, "マ": 471, "ミ": 472, "ム": 473, "モ": 474, "ャ": 475, "ュ": 476, "ョ": 477, "ラ": 478, "リ": 479, "ル": 480, "レ": 481, "ロ": 482, "ン": 483, "・": 484, "ー": 485, "一": 486, "七": 487, "下": 488, "世": 489, "丙": 490, "中": 491, "主": 492, "乃": 493, "之": 494, "乙": 495, "九": 496, "二": 497, "云": 498, "人": 499, "今": 500, "付": 501, "作": 502, "侗": 503, "依": 504, "信": 505, "傳": 506, "儚": 507, "充": 508, "光": 509, "全": 510, "兵": 511, "其": 512, "具": 513, "円": 514, "再": 515, "出": 516, "判": 517, "前": 518, "剛": 519, "劇": 520, "劉": 521, "動": 522, "化": 523, "北": 524, "华": 525, "厂": 526, "去": 527, "古": 528, "可": 529, "台": 530, "史": 531, "同": 532, "名": 533, "君": 534, "吳": 535, "周": 536, "命": 537, "和": 538, "咲": 539, "善": 540, "四": 541, "國": 542, "園": 543, "圣": 544, "在": 545, "坂": 546, "堤": 547, "場": 548, "塘": 549, "夕": 550, "大": 551, "天": 552, "夫": 553, "女": 554, "妙": 555, "姚": 556, "子": 557, "孟": 558, "守": 559, "安": 560, "宋": 561, "完": 562, "宗": 563, "宝": 564, "宫": 565, "寝": 566, "寺": 567, "小": 568, "少": 569, "尾": 570, "山": 571, "岳": 572, "川": 573, "州": 574, "巳": 575, "市": 576, "師": 577, "平": 578, "广": 579, "庆": 580, "府": 581, "座": 582, "廬": 583, "建": 584, "式": 585, "張": 586, "彌": 587, "彩": 588, "彼": 589, "後": 590, "御": 591, "德": 592, "思": 593, "愛": 594, "憑": 595, "憶": 596, "應": 597, "懷": 598, "战": 599, "戦": 600, "扈": 601, "技": 602, "拉": 603, "拳": 604, "挑": 605, "揺": 606, "攻": 607, "放": 608, "政": 609, "散": 610, "斯": 611, "方": 612, "日": 613, "旦": 614, "旭": 615, "昌": 616, "明": 617, "星": 618, "春": 619, "晋": 620, "景": 621, "曦": 622, "月": 623, "望": 624, "未": 625, "本": 626, "李": 627, "村": 628, "杜": 629, "束": 630, "来": 631, "林": 632, "桜": 633, "梶": 634, "棘": 635, "椎": 636, "楊": 637, "楚": 638, "榮": 639, "橘": 640, "機": 641, "正": 642, "殻": 643, "殿": 644, "母": 645, "水": 646, "汉": 647, "沂": 648, "沙": 649, "河": 650, "泗": 651, "波": 652, "泣": 653, "洪": 654, "淹": 655, "清": 656, "湯": 657, "漢": 658, "澄": 659, "澤": 660, "火": 661, "灯": 662, "灵": 663, "灼": 664, "焼": 665, "熱": 666, "物": 667, "狐": 668, "狸": 669, "玄": 670, "王": 671, "玩": 672, "珂": 673, "珙": 674, "球": 675, "理": 676, "琦": 677, "琪": 678, "瓊": 679, "生": 680, "田": 681, "畢": 682, "番": 683, "瘡": 684, "白": 685, "皮": 686, "真": 687, "砲": 688, "礮": 689, "祈": 690, "神": 691, "祠": 692, "秋": 693, "空": 694, "立": 695, "精": 696, "約": 697, "絵": 698, "織": 699, "義": 700, "翠": 701, "者": 702, "耕": 703, "肖": 704, "胡": 705, "膀": 706, "臂": 707, "興": 708, "良": 709, "花": 710, "芳": 711, "芽": 712, "若": 713, "英": 714, "藕": 715, "藥": 716, "蘄": 717, "蘇": 718, "行": 719, "裁": 720, "規": 721, "覺": 722, "观": 723, "解": 724, "記": 725, "誓": 726, "誡": 727, "誰": 728, "謎": 729, "许": 730, "谭": 731, "豪": 732, "豫": 733, "費": 734, "贵": 735, "赤": 736, "趙": 737, "足": 738, "跡": 739, "転": 740, "辛": 741, "逆": 742, "遇": 743, "運": 744, "過": 745, "遠": 746, "選": 747, "邦": 748, "邱": 749, "部": 750, "郭": 751, "都": 752, "酈": 753, "里": 754, "野": 755, "金": 756, "銃": 757, "鋼": 758, "錄": 759, "錡": 760, "鍵": 761, "鐵": 762, "钱": 763, "铁": 764, "關": 765, "防": 766, "阿": 767, "陈": 768, "陳": 769, "陽": 770, "隊": 771, "階": 772, "集": 773, "雪": 774, "雲": 775, "霖": 776, "霹": 777, "靂": 778, "韓": 779, "願": 780, "顯": 781, "颜": 782, "马": 783, "高": 784, "龍": 785, "ﷲ": 786, "ﻋ": 787, "/": 788, "3": 789, "~": 790, "##r": 791, "##o": 792, "##s": 793, "##z": 794, "##i": 795, "##e": 796, "##c": 797, "##p": 798, "##h": 799, "##l": 800, "##a": 801, "##f": 802, "##t": 803, "##n": 804, "##k": 805, "##m": 806, "##d": 807, "##u": 808, "##b": 809, "##y": 810, "##7": 811, "##v": 812, "##g": 813, "##5": 814, "##0": 815, "##6": 816, "##9": 817, "##4": 818, "##υ": 819, "##є": 820, "##λ": 821, "##ο": 822, "##ς": 823, "##8": 824, "##j": 825, "##ø": 826, "##ß": 827, "##α": 828, "##w": 829, "##2": 830, "##1": 831, "##3": 832, "##ł": 833, "##β": 834, "##x": 835, "##რ": 836, "##გ": 837, "##ვ": 838, "##ლ": 839, "##ო": 840, "##ა": 841, "##ნ": 842, "##ი": 843, "##q": 844, "##ュ": 845, "##ナ": 846, "##ミ": 847, "##ス": 848, "##ォ": 849, "##ル": 850, "##ト": 851, "##ゥ": 852, "##フ": 853, "##ل": 854, "##ا": 855, "##ب": 856, "##ː": 857, "##ɒ": 858, "##っ": 859, "##მ": 860, "##ე": 861, "##æ": 862, "##お": 863, "##り": 864, "##γ": 865, "##ρ": 866, "##ə": 867, "##か": 868, "##な": 869, "##た": 870, "##は": 871, "##め": 872, "##წ": 873, "##ფ": 874, "##δ": 875, "##μ": 876, "##ε": 877, "##ι": 878, "##つ": 879, "##đ": 880, "##о": 881, "##с": 882, "##п": 883, "##д": 884, "##н": 885, "##е": 886, "##ხ": 887, "##დ": 888, "##ハ": 889, "##エ": 890, "##タ": 891, "##テ": 892, "##イ": 893, "##く": 894, "##ん": 895, "##ー": 896, "##ю": 897, "##з": 898, "##ป": 899, "##ย": 900, "##ر": 901, "##ث": 902, "##م": 903, "##د": 904, "##ウ": 905, "##ァ": 906, "##キ": 907, "##リ": 908, "##ア": 909, "##3": 910, "##ს": 911, "##あ": 912, "##ल": 913, "##ʻ": 914, "##ノ": 915, "##พ": 916, "##ร": 917, "##ص": 918, "##ن": 919, "##р": 920, "##и": 921, "##т": 922, "##ɑ": 923, "##ω": 924, "##ν": 925, "##ı": 926, "##უ": 927, "##ც": 928, "##ه": 929, "##а": 930, "##в": 931, "##к": 932, "##ˈ": 933, "##ɳ": 934, "##ɛ": 935, "##ʊ": 936, "##τ": 937, "##κ": 938, "##ɐ": 939, "##ɽ": 940, "##თ": 941, "##ɪ": 942, "##こ": 943, "##の": 944, "##ב": 945, "##ת": 946, "##א": 947, "##י": 948, "##л": 949, "##у": 950, "##я": 951, "##ਲ": 952, "##ਹ": 953, "##ツ": 954, "##ネ": 955, "##ा": 956, "##ह": 957, "##ค": 958, "##ว": 959, "##ต": 960, "##ʿ": 961, "##ਾ": 962, "##ʃ": 963, "##س": 964, "##ت": 965, "##แ": 966, "##ก": 967, "##し": 968, "##す": 969, "##き": 970, "##ひ": 971, "##と": 972, "##ɡ": 973, "##ল": 974, "##ण": 975, "##स": 976, "##न": 977, "##ʒ": 978, "##ტ": 979, "##ჱ": 980, "##ภ": 981, "##า": 982, "##ด": 983, "##ラ": 984, "##ッ": 985, "##シ": 986, "##を": 987, "##ל": 988, "##ה": 989, "##ן": 990, "##σ": 991, "##ш": 992, "##ъ": 993, "##ו": 994, "##פ": 995, "##ซ": 996, "##う": 997, "##ィ": 998, "##ы": 999, "##ي": 1000, "##ン": 1001, "##カ": 1002, "##ई": 1003, "##ჳ": 1004, "##ᵻ": 1005, "##ɾ": 1006, "##ʲ": 1007, "##ク": 1008, "##サ": 1009, "##г": 1010, "##ᅡ": 1011, "##ᆯ": 1012, "##ᄅ": 1013, "##ロ": 1014, "##η": 1015, "##ら": 1016, "##θ": 1017, "##ɔ": 1018, "##ล": 1019, "##อ": 1020, "##ฮ": 1021, "##χ": 1022, "##ɜ": 1023, "##ר": 1024, "##ם": 1025, "##º": 1026, "##र": 1027, "##れ": 1028, "##る": 1029, "##い": 1030, "##ะ": 1031, "##ช": 1032, "##น": 1033, "##ェ": 1034, "##レ": 1035, "##ニ": 1036, "##ف": 1037, "##ц": 1038, "##ь": 1039, "##ณ": 1040, "##ม": 1041, "##м": 1042, "##द": 1043, "##π": 1044, "##ش": 1045, "##و": 1046, "##خ": 1047, "##ʔ": 1048, "##ム": 1049, "##チ": 1050, "##ع": 1051, "##ة": 1052, "##נ": 1053, "##ち": 1054, "##ゃ": 1055, "##み": 1056, "##ء": 1057, "##व": 1058, "##ξ": 1059, "##ョ": 1060, "##ᄇ": 1061, "##ᅮ": 1062, "##ᄃ": 1063, "##ᅢ": 1064, "##ᅦ": 1065, "##ᅩ": 1066, "##ᆨ": 1067, "##ᅵ": 1068, "##ᆸ": 1069, "##ᅧ": 1070, "##ᆼ": 1071, "##ᄋ": 1072, "##ᆫ": 1073, "##ق": 1074, "##ि": 1075, "##ग": 1076, "##ψ": 1077, "##ง": 1078, "##ไ": 1079, "##ʁ": 1080, "##せ": 1081, "##ള": 1082, "##ح": 1083, "##マ": 1084, "##ˌ": 1085, "##ャ": 1086, "##モ": 1087, "##ჲ": 1088, "##ð": 1089, "##œ": 1090, "##ま": 1091, "##ܕ": 1092, "##ܝ": 1093, "##ܢ": 1094, "##ܬ": 1095, "##ാ": 1096, "##ഹ": 1097, "##х": 1098, "##セ": 1099, "##オ": 1100, "##も": 1101, "##ж": 1102, "##ף": 1103, "##ょ": 1104, "##に": 1105, "##ש": 1106, "##מ": 1107, "##צ": 1108, "##ذ": 1109, "##ゆ": 1110, "##ษ": 1111, "##ฐ": 1112, "##ك": 1113, "##া": 1114, "##হ": 1115, "##क": 1116, "##ܠ": 1117, "##ܗ": 1118, "##ܐ": 1119, "##เ": 1120, "##ქ": 1121, "##わ": 1122, "##ס": 1123, "##ɫ": 1124 } } }