vladiokc commited on
Commit
0d4d77e
1 Parent(s): 06508da

Upload 13 files

Browse files
Files changed (14) hide show
  1. .gitattributes +1 -0
  2. config.cfg +147 -0
  3. meta.json +58 -0
  4. ner/cfg +13 -0
  5. ner/model +0 -0
  6. ner/moves +1 -0
  7. tokenizer +3 -0
  8. transformer/cfg +3 -0
  9. transformer/model +3 -0
  10. vocab/key2row +1 -0
  11. vocab/lookups.bin +3 -0
  12. vocab/strings.json +1493 -0
  13. vocab/vectors +0 -0
  14. vocab/vectors.cfg +3 -0
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  model-best/transformer/model filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  model-best/transformer/model filter=lfs diff=lfs merge=lfs -text
37
+ transformer/model filter=lfs diff=lfs merge=lfs -text
config.cfg ADDED
@@ -0,0 +1,147 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [paths]
2
+ train = "./train_data.spacy"
3
+ dev = "./dev_data.spacy"
4
+ vectors = null
5
+ init_tok2vec = null
6
+
7
+ [system]
8
+ gpu_allocator = "pytorch"
9
+ seed = 0
10
+
11
+ [nlp]
12
+ lang = "it"
13
+ pipeline = ["transformer","ner"]
14
+ batch_size = 128
15
+ disabled = []
16
+ before_creation = null
17
+ after_creation = null
18
+ after_pipeline_creation = null
19
+ tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
20
+ vectors = {"@vectors":"spacy.Vectors.v1"}
21
+
22
+ [components]
23
+
24
+ [components.ner]
25
+ factory = "ner"
26
+ incorrect_spans_key = null
27
+ moves = null
28
+ scorer = {"@scorers":"spacy.ner_scorer.v1"}
29
+ update_with_oracle_cut_size = 100
30
+
31
+ [components.ner.model]
32
+ @architectures = "spacy.TransitionBasedParser.v2"
33
+ state_type = "ner"
34
+ extra_state_tokens = false
35
+ hidden_width = 64
36
+ maxout_pieces = 2
37
+ use_upper = false
38
+ nO = null
39
+
40
+ [components.ner.model.tok2vec]
41
+ @architectures = "spacy-transformers.TransformerListener.v1"
42
+ grad_factor = 1.0
43
+ pooling = {"@layers":"reduce_mean.v1"}
44
+ upstream = "*"
45
+
46
+ [components.transformer]
47
+ factory = "transformer"
48
+ max_batch_items = 4096
49
+ set_extra_annotations = {"@annotation_setters":"spacy-transformers.null_annotation_setter.v1"}
50
+
51
+ [components.transformer.model]
52
+ @architectures = "spacy-transformers.TransformerModel.v3"
53
+ name = "bert-base-multilingual-uncased"
54
+ mixed_precision = false
55
+
56
+ [components.transformer.model.get_spans]
57
+ @span_getters = "spacy-transformers.strided_spans.v1"
58
+ window = 128
59
+ stride = 96
60
+
61
+ [components.transformer.model.grad_scaler_config]
62
+
63
+ [components.transformer.model.tokenizer_config]
64
+ use_fast = true
65
+
66
+ [components.transformer.model.transformer_config]
67
+
68
+ [corpora]
69
+
70
+ [corpora.dev]
71
+ @readers = "spacy.Corpus.v1"
72
+ path = ${paths.dev}
73
+ max_length = 0
74
+ gold_preproc = false
75
+ limit = 0
76
+ augmenter = null
77
+
78
+ [corpora.train]
79
+ @readers = "spacy.Corpus.v1"
80
+ path = ${paths.train}
81
+ max_length = 0
82
+ gold_preproc = false
83
+ limit = 0
84
+ augmenter = null
85
+
86
+ [training]
87
+ dev_corpus = "corpora.dev"
88
+ train_corpus = "corpora.train"
89
+ seed = ${system.seed}
90
+ gpu_allocator = ${system.gpu_allocator}
91
+ dropout = 0.1
92
+ accumulate_gradient = 1
93
+ patience = 1600
94
+ max_epochs = 0
95
+ max_steps = 20000
96
+ eval_frequency = 200
97
+ frozen_components = []
98
+ annotating_components = []
99
+ before_to_disk = null
100
+ before_update = null
101
+
102
+ [training.batcher]
103
+ @batchers = "spacy.batch_by_padded.v1"
104
+ discard_oversize = true
105
+ size = 2000
106
+ buffer = 256
107
+ get_length = null
108
+
109
+ [training.logger]
110
+ @loggers = "spacy.ConsoleLogger.v1"
111
+ progress_bar = false
112
+
113
+ [training.optimizer]
114
+ @optimizers = "Adam.v1"
115
+ beta1 = 0.9
116
+ beta2 = 0.999
117
+ L2_is_weight_decay = true
118
+ L2 = 0.01
119
+ grad_clip = 1.0
120
+ use_averages = false
121
+ eps = 0.00000001
122
+
123
+ [training.optimizer.learn_rate]
124
+ @schedules = "warmup_linear.v1"
125
+ warmup_steps = 250
126
+ total_steps = 20000
127
+ initial_rate = 0.00005
128
+
129
+ [training.score_weights]
130
+ ents_f = 1.0
131
+ ents_p = 0.0
132
+ ents_r = 0.0
133
+ ents_per_type = null
134
+
135
+ [pretraining]
136
+
137
+ [initialize]
138
+ vectors = ${paths.vectors}
139
+ init_tok2vec = ${paths.init_tok2vec}
140
+ vocab_data = null
141
+ lookups = null
142
+ before_init = null
143
+ after_init = null
144
+
145
+ [initialize.components]
146
+
147
+ [initialize.tokenizer]
meta.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "lang":"it",
3
+ "name":"pipeline",
4
+ "version":"0.0.0",
5
+ "spacy_version":">=3.7.5,<3.8.0",
6
+ "description":"",
7
+ "author":"",
8
+ "email":"",
9
+ "url":"",
10
+ "license":"",
11
+ "spacy_git_version":"a6d0fc360",
12
+ "vectors":{
13
+ "width":0,
14
+ "vectors":0,
15
+ "keys":0,
16
+ "name":null,
17
+ "mode":"default"
18
+ },
19
+ "labels":{
20
+ "transformer":[
21
+
22
+ ],
23
+ "ner":[
24
+ "COMMAND",
25
+ "PERSON"
26
+ ]
27
+ },
28
+ "pipeline":[
29
+ "transformer",
30
+ "ner"
31
+ ],
32
+ "components":[
33
+ "transformer",
34
+ "ner"
35
+ ],
36
+ "disabled":[
37
+
38
+ ],
39
+ "performance":{
40
+ "ents_f":1.0,
41
+ "ents_p":1.0,
42
+ "ents_r":1.0,
43
+ "ents_per_type":{
44
+ "COMMAND":{
45
+ "p":1.0,
46
+ "r":1.0,
47
+ "f":1.0
48
+ },
49
+ "PERSON":{
50
+ "p":1.0,
51
+ "r":1.0,
52
+ "f":1.0
53
+ }
54
+ },
55
+ "transformer_loss":0.0000000512,
56
+ "ner_loss":9306.5799357916
57
+ }
58
+ }
ner/cfg ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "moves":null,
3
+ "update_with_oracle_cut_size":100,
4
+ "multitasks":[
5
+
6
+ ],
7
+ "min_action_freq":1,
8
+ "learn_tokens":false,
9
+ "beam_width":1,
10
+ "beam_density":0.0,
11
+ "beam_update_prob":0.0,
12
+ "incorrect_spans_key":null
13
+ }
ner/model ADDED
Binary file (213 kB). View file
 
ner/moves ADDED
@@ -0,0 +1 @@
 
 
1
+ ��movesٜ{"0":{},"1":{"COMMAND":894,"PERSON":718},"2":{"COMMAND":894,"PERSON":718},"3":{"COMMAND":894,"PERSON":718},"4":{"COMMAND":894,"PERSON":718,"":1},"5":{"":1}}�cfg��neg_key�
tokenizer ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ ��prefix_search� �^'[0-9][0-9]|^[0-9]+°|^§|^%|^=|^—|^–|^\+(?![0-9])|^…|^……|^,|^:|^;|^\!|^\?|^¿|^؟|^¡|^\(|^\)|^\[|^\]|^\{|^\}|^<|^>|^_|^#|^\*|^&|^。|^?|^!|^,|^、|^;|^:|^~|^·|^।|^،|^۔|^؛|^٪|^\.\.+|^…|^\'|^"|^”|^“|^`|^‘|^´|^’|^‚|^,|^„|^»|^«|^「|^」|^『|^』|^(|^)|^〔|^〕|^【|^】|^《|^》|^〈|^〉|^〈|^〉|^⟦|^⟧|^\$|^£|^€|^¥|^฿|^US\$|^C\$|^A\$|^₽|^﷼|^₴|^₠|^₡|^₢|^₣|^₤|^₥|^₦|^₧|^₨|^₩|^₪|^₫|^€|^₭|^₮|^₯|^₰|^₱|^₲|^₳|^₴|^₵|^₶|^₷|^₸|^₹|^₺|^₻|^₼|^₽|^₾|^₿|^[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25B6\u25B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u2670-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036\u3037\u303E\u303F\u3190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010AC8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\U0001D800-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]�suffix_search�2�…$|……$|,$|:$|;$|\!$|\?$|¿$|؟$|¡$|\($|\)$|\[$|\]$|\{$|\}$|<$|>$|_$|#$|\*$|&$|。$|?$|!$|,$|、$|;$|:$|~$|·$|।$|،$|۔$|؛$|٪$|\.\.+$|…$|\'$|"$|”$|“$|`$|‘$|´$|’$|‚$|,$|„$|»$|«$|「$|」$|『$|』$|($|)$|〔$|〕$|【$|】$|《$|》$|〈$|〉$|〈$|〉$|⟦$|⟧$|[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25B6\u25B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u2670-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036\u3037\u303E\u303F\u3190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010AC8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\U0001D800-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]$|'s$|'S$|’s$|’S$|—$|–$|(?<=[0-9])\+$|(?<=°[FfCcKk])\.$|(?<=[0-9])(?:\$|£|€|¥|฿|US\$|C\$|A\$|₽|﷼|₴|₠|₡|₢|₣|₤|₥|₦|₧|₨|₩|₪|₫|€|₭|₮|₯|₰|₱|₲|₳|₴|₵|₶|₷|₸|₹|₺|₻|₼|₽|₾|₿)$|(?<=[0-9])(?:km|km²|km³|m|m²|m³|dm|dm²|dm³|cm|cm²|cm³|mm|mm²|mm³|ha|µm|nm|yd|in|ft|kg|g|mg|µg|t|lb|oz|m/s|km/h|kmh|mph|hPa|Pa|mbar|mb|MB|kb|KB|gb|GB|tb|TB|T|G|M|K|%|км|км²|км³|м|м²|м³|дм|дм²|дм³|см|см²|см³|мм|мм²|мм³|нм|кг|г|мг|м/с|км/ч|кПа|Па|мбар|Кб|КБ|кб|Мб|МБ|мб|Гб|ГБ|гб|Тб|ТБ|тбكم|كم²|كم³|م|م²|م³|سم|سم²|سم³|مم|مم²|مم³|كم|غرام|جرام|جم|كغ|ملغ|كوب|اكواب)$|(?<=[0-9a-z\uFF41-\uFF5A\u00DF-\u00F6\u00F8-\u00FF\u0101\u0103\u0105\u0107\u0109\u010B\u010D\u010F\u0111\u0113\u0115\u0117\u0119\u011B\u011D\u011F\u0121\u0123\u0125\u0127\u0129\u012B\u012D\u012F\u0131\u0133\u0135\u0137\u0138\u013A\u013C\u013E\u0140\u0142\u0144\u0146\u0148\u0149\u014B\u014D\u014F\u0151\u0153\u0155\u0157\u0159\u015B\u015D\u015F\u0161\u0163\u0165\u0167\u0169\u016B\u016D\u016F\u0171\u0173\u0175\u0177\u017A\u017C\u017E\u017F\u0180\u0183\u0185\u0188\u018C\u018D\u0192\u0195\u0199-\u019B\u019E\u01A1\u01A3\u01A5\u01A8\u01AA\u01AB\u01AD\u01B0\u01B4\u01B6\u01B9\u01BA\u01BD-\u01BF\u01C6\u01C9\u01CC\u01CE\u01D0\u01D2\u01D4\u01D6\u01D8\u01DA\u01DC\u01DD\u01DF\u01E1\u01E3\u01E5\u01E7\u01E9\u01EB\u01ED\u01EF\u01F0\u01F3\u01F5\u01F9\u01FB\u01FD\u01FF\u0201\u0203\u0205\u0207\u0209\u020B\u020D\u020F\u0211\u0213\u0215\u0217\u0219\u021B\u021D\u021F\u0221\u0223\u0225\u0227\u0229\u022B\u022D\u022F\u0231\u0233-\u0239\u023C\u023F\u0240\u0242\u0247\u0249\u024B\u024D\u024F\u2C61\u2C65\u2C66\u2C68\u2C6A\u2C6C\u2C71\u2C73\u2C74\u2C76-\u2C7B\uA723\uA725\uA727\uA729\uA72B\uA72D\uA72F-\uA731\uA733\uA735\uA737\uA739\uA73B\uA73D\uA73F\uA741\uA743\uA745\uA747\uA749\uA74B\uA74D\uA74F\uA751\uA753\uA755\uA757\uA759\uA75B\uA75D\uA75F\uA761\uA763\uA765\uA767\uA769\uA76B\uA76D\uA76F\uA771-\uA778\uA77A\uA77C\uA77F\uA781\uA783\uA785\uA787\uA78C\uA78E\uA791\uA793-\uA795\uA797\uA799\uA79B\uA79D\uA79F\uA7A1\uA7A3\uA7A5\uA7A7\uA7A9\uA7AF\uA7B5\uA7B7\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E01\u1E03\u1E05\u1E07\u1E09\u1E0B\u1E0D\u1E0F\u1E11\u1E13\u1E15\u1E17\u1E19\u1E1B\u1E1D\u1E1F\u1E21\u1E23\u1E25\u1E27\u1E29\u1E2B\u1E2D\u1E2F\u1E31\u1E33\u1E35\u1E37\u1E39\u1E3B\u1E3D\u1E3F\u1E41\u1E43\u1E45\u1E47\u1E49\u1E4B\u1E4D\u1E4F\u1E51\u1E53\u1E55\u1E57\u1E59\u1E5B\u1E5D\u1E5F\u1E61\u1E63\u1E65\u1E67\u1E69\u1E6B\u1E6D\u1E6F\u1E71\u1E73\u1E75\u1E77\u1E79\u1E7B\u1E7D\u1E7F\u1E81\u1E83\u1E85\u1E87\u1E89\u1E8B\u1E8D\u1E8F\u1E91\u1E93\u1E95-\u1E9D\u1E9F\u1EA1\u1EA3\u1EA5\u1EA7\u1EA9\u1EAB\u1EAD\u1EAF\u1EB1\u1EB3\u1EB5\u1EB7\u1EB9\u1EBB\u1EBD\u1EBF\u1EC1\u1EC3\u1EC5\u1EC7\u1EC9\u1ECB\u1ECD\u1ECF\u1ED1\u1ED3\u1ED5\u1ED7\u1ED9\u1EDB\u1EDD\u1EDF\u1EE1\u1EE3\u1EE5\u1EE7\u1EE9\u1EEB\u1EED\u1EEF\u1EF1\u1EF3\u1EF5\u1EF7\u1EF9\u1EFB\u1EFD\u1EFFёа-яәөүҗңһα-ωάέίόώήύа-щюяіїєґѓѕјљњќѐѝ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F%²\-\+…|……|,|:|;|\!|\?|¿|؟|¡|\(|\)|\[|\]|\{|\}|<|>|_|#|\*|&|。|?|!|,|、|;|:|~|·|।|،|۔|؛|٪(?:\'"”“`‘´’‚,„»«「」『』()〔〕【】《》〈〉〈〉⟦⟧)])\.$|(?<=[A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u0202\u0204\u0206\u0208\u020A\u020C\u020E\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\uA736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA744\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F][A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u0202\u0204\u0206\u0208\u020A\u020C\u020E\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\uA736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA744\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])\.$�infix_finditer�O�\.\.+|…|[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25B6\u25B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u2670-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036\u3037\u303E\u303F\u3190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010AC8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\U0001D800-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]|(?<=[0-9])[+\-\*^](?=[0-9-])|(?<=[a-z\uFF41-\uFF5A\u00DF-\u00F6\u00F8-\u00FF\u0101\u0103\u0105\u0107\u0109\u010B\u010D\u010F\u0111\u0113\u0115\u0117\u0119\u011B\u011D\u011F\u0121\u0123\u0125\u0127\u0129\u012B\u012D\u012F\u0131\u0133\u0135\u0137\u0138\u013A\u013C\u013E\u0140\u0142\u0144\u0146\u0148\u0149\u014B\u014D\u014F\u0151\u0153\u0155\u0157\u0159\u015B\u015D\u015F\u0161\u0163\u0165\u0167\u0169\u016B\u016D\u016F\u0171\u0173\u0175\u0177\u017A\u017C\u017E\u017F\u0180\u0183\u0185\u0188\u018C\u018D\u0192\u0195\u0199-\u019B\u019E\u01A1\u01A3\u01A5\u01A8\u01AA\u01AB\u01AD\u01B0\u01B4\u01B6\u01B9\u01BA\u01BD-\u01BF\u01C6\u01C9\u01CC\u01CE\u01D0\u01D2\u01D4\u01D6\u01D8\u01DA\u01DC\u01DD\u01DF\u01E1\u01E3\u01E5\u01E7\u01E9\u01EB\u01ED\u01EF\u01F0\u01F3\u01F5\u01F9\u01FB\u01FD\u01FF\u0201\u0203\u0205\u0207\u0209\u020B\u020D\u020F\u0211\u0213\u0215\u0217\u0219\u021B\u021D\u021F\u0221\u0223\u0225\u0227\u0229\u022B\u022D\u022F\u0231\u0233-\u0239\u023C\u023F\u0240\u0242\u0247\u0249\u024B\u024D\u024F\u2C61\u2C65\u2C66\u2C68\u2C6A\u2C6C\u2C71\u2C73\u2C74\u2C76-\u2C7B\uA723\uA725\uA727\uA729\uA72B\uA72D\uA72F-\uA731\uA733\uA735\uA737\uA739\uA73B\uA73D\uA73F\uA741\uA743\uA745\uA747\uA749\uA74B\uA74D\uA74F\uA751\uA753\uA755\uA757\uA759\uA75B\uA75D\uA75F\uA761\uA763\uA765\uA767\uA769\uA76B\uA76D\uA76F\uA771-\uA778\uA77A\uA77C\uA77F\uA781\uA783\uA785\uA787\uA78C\uA78E\uA791\uA793-\uA795\uA797\uA799\uA79B\uA79D\uA79F\uA7A1\uA7A3\uA7A5\uA7A7\uA7A9\uA7AF\uA7B5\uA7B7\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E01\u1E03\u1E05\u1E07\u1E09\u1E0B\u1E0D\u1E0F\u1E11\u1E13\u1E15\u1E17\u1E19\u1E1B\u1E1D\u1E1F\u1E21\u1E23\u1E25\u1E27\u1E29\u1E2B\u1E2D\u1E2F\u1E31\u1E33\u1E35\u1E37\u1E39\u1E3B\u1E3D\u1E3F\u1E41\u1E43\u1E45\u1E47\u1E49\u1E4B\u1E4D\u1E4F\u1E51\u1E53\u1E55\u1E57\u1E59\u1E5B\u1E5D\u1E5F\u1E61\u1E63\u1E65\u1E67\u1E69\u1E6B\u1E6D\u1E6F\u1E71\u1E73\u1E75\u1E77\u1E79\u1E7B\u1E7D\u1E7F\u1E81\u1E83\u1E85\u1E87\u1E89\u1E8B\u1E8D\u1E8F\u1E91\u1E93\u1E95-\u1E9D\u1E9F\u1EA1\u1EA3\u1EA5\u1EA7\u1EA9\u1EAB\u1EAD\u1EAF\u1EB1\u1EB3\u1EB5\u1EB7\u1EB9\u1EBB\u1EBD\u1EBF\u1EC1\u1EC3\u1EC5\u1EC7\u1EC9\u1ECB\u1ECD\u1ECF\u1ED1\u1ED3\u1ED5\u1ED7\u1ED9\u1EDB\u1EDD\u1EDF\u1EE1\u1EE3\u1EE5\u1EE7\u1EE9\u1EEB\u1EED\u1EEF\u1EF1\u1EF3\u1EF5\u1EF7\u1EF9\u1EFB\u1EFD\u1EFFёа-яәөүҗңһα-ωάέίόώήύа-щюяіїєґѓѕјљњќѐѝ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F\'"”“`‘´’‚,„»«「」『』()〔〕【】《》〈〉〈〉⟦⟧])\.(?=[A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u0202\u0204\u0206\u0208\u020A\u020C\u020E\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\uA736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA744\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F\'"”“`‘´’‚,„»«「」『』()〔〕【】《》〈〉〈〉⟦⟧])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F]),(?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])(?:-|–|—|--|---|——|~)(?=[a-z\uFF41-\uFF5A\u00DF-\u00F6\u00F8-\u00FF\u0101\u0103\u0105\u0107\u0109\u010B\u010D\u010F\u0111\u0113\u0115\u0117\u0119\u011B\u011D\u011F\u0121\u0123\u0125\u0127\u0129\u012B\u012D\u012F\u0131\u0133\u0135\u0137\u0138\u013A\u013C\u013E\u0140\u0142\u0144\u0146\u0148\u0149\u014B\u014D\u014F\u0151\u0153\u0155\u0157\u0159\u015B\u015D\u015F\u0161\u0163\u0165\u0167\u0169\u016B\u016D\u016F\u0171\u0173\u0175\u0177\u017A\u017C\u017E\u017F\u0180\u0183\u0185\u0188\u018C\u018D\u0192\u0195\u0199-\u019B\u019E\u01A1\u01A3\u01A5\u01A8\u01AA\u01AB\u01AD\u01B0\u01B4\u01B6\u01B9\u01BA\u01BD-\u01BF\u01C6\u01C9\u01CC\u01CE\u01D0\u01D2\u01D4\u01D6\u01D8\u01DA\u01DC\u01DD\u01DF\u01E1\u01E3\u01E5\u01E7\u01E9\u01EB\u01ED\u01EF\u01F0\u01F3\u01F5\u01F9\u01FB\u01FD\u01FF\u0201\u0203\u0205\u0207\u0209\u020B\u020D\u020F\u0211\u0213\u0215\u0217\u0219\u021B\u021D\u021F\u0221\u0223\u0225\u0227\u0229\u022B\u022D\u022F\u0231\u0233-\u0239\u023C\u023F\u0240\u0242\u0247\u0249\u024B\u024D\u024F\u2C61\u2C65\u2C66\u2C68\u2C6A\u2C6C\u2C71\u2C73\u2C74\u2C76-\u2C7B\uA723\uA725\uA727\uA729\uA72B\uA72D\uA72F-\uA731\uA733\uA735\uA737\uA739\uA73B\uA73D\uA73F\uA741\uA743\uA745\uA747\uA749\uA74B\uA74D\uA74F\uA751\uA753\uA755\uA757\uA759\uA75B\uA75D\uA75F\uA761\uA763\uA765\uA767\uA769\uA76B\uA76D\uA76F\uA771-\uA778\uA77A\uA77C\uA77F\uA781\uA783\uA785\uA787\uA78C\uA78E\uA791\uA793-\uA795\uA797\uA799\uA79B\uA79D\uA79F\uA7A1\uA7A3\uA7A5\uA7A7\uA7A9\uA7AF\uA7B5\uA7B7\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E01\u1E03\u1E05\u1E07\u1E09\u1E0B\u1E0D\u1E0F\u1E11\u1E13\u1E15\u1E17\u1E19\u1E1B\u1E1D\u1E1F\u1E21\u1E23\u1E25\u1E27\u1E29\u1E2B\u1E2D\u1E2F\u1E31\u1E33\u1E35\u1E37\u1E39\u1E3B\u1E3D\u1E3F\u1E41\u1E43\u1E45\u1E47\u1E49\u1E4B\u1E4D\u1E4F\u1E51\u1E53\u1E55\u1E57\u1E59\u1E5B\u1E5D\u1E5F\u1E61\u1E63\u1E65\u1E67\u1E69\u1E6B\u1E6D\u1E6F\u1E71\u1E73\u1E75\u1E77\u1E79\u1E7B\u1E7D\u1E7F\u1E81\u1E83\u1E85\u1E87\u1E89\u1E8B\u1E8D\u1E8F\u1E91\u1E93\u1E95-\u1E9D\u1E9F\u1EA1\u1EA3\u1EA5\u1EA7\u1EA9\u1EAB\u1EAD\u1EAF\u1EB1\u1EB3\u1EB5\u1EB7\u1EB9\u1EBB\u1EBD\u1EBF\u1EC1\u1EC3\u1EC5\u1EC7\u1EC9\u1ECB\u1ECD\u1ECF\u1ED1\u1ED3\u1ED5\u1ED7\u1ED9\u1EDB\u1EDD\u1EDF\u1EE1\u1EE3\u1EE5\u1EE7\u1EE9\u1EEB\u1EED\u1EEF\u1EF1\u1EF3\u1EF5\u1EF7\u1EF9\u1EFB\u1EFD\u1EFFёа-яәөүҗңһα-ωάέίόώήύа-щюяіїєґѓѕјљњќѐѝ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F0-9])[:<>=\/](?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F]['’])(?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F0-9\"])�token_match��url_match�
2
+ ��A�
3
+ � ��A� �'��A�'�''��A�''�(*_*)��A�(*_*)�(-8��A�(-8�(-:��A�(-:�(-;��A�(-;�(-_-)��A�(-_-)�(._.)��A�(._.)�(:��A�(:�(;��A�(;�(=��A�(=�(>_<)��A�(>_<)�(^_^)��A�(^_^)�(o:��A�(o:�(¬_¬)��A�(¬_¬)�(ಠ_ಠ)��A�(ಠ_ಠ)�(╯°□°)╯︵┻━┻��A�(╯°□°)╯︵┻━┻�)-:��A�)-:�):��A�):�-_-��A�-_-�-__-��A�-__-�..��A�..�....��A�....�._.��A�._.�0.0��A�0.0�0.o��A�0.o�0_0��A�0_0�0_o��A�0_o�8)��A�8)�8-)��A�8-)�8-D��A�8-D�8D��A�8D�:'(��A�:'(�:')��A�:')�:'-(��A�:'-(�:'-)��A�:'-)�:(��A�:(�:((��A�:((�:(((��A�:(((�:()��A�:()�:)��A�:)�:))��A�:))�:)))��A�:)))�:*��A�:*�:-(��A�:-(�:-((��A�:-((�:-(((��A�:-(((�:-)��A�:-)�:-))��A�:-))�:-)))��A�:-)))�:-*��A�:-*�:-/��A�:-/�:-0��A�:-0�:-3��A�:-3�:->��A�:->�:-D��A�:-D�:-O��A�:-O�:-P��A�:-P�:-X��A�:-X�:-]��A�:-]�:-o��A�:-o�:-p��A�:-p�:-x��A�:-x�:-|��A�:-|�:-}��A�:-}�:/��A�:/�:0��A�:0�:1��A�:1�:3��A�:3�:>��A�:>�:D��A�:D�:O��A�:O�:P��A�:P�:X��A�:X�:]��A�:]�:o��A�:o�:o)��A�:o)�:p��A�:p�:x��A�:x�:|��A�:|�:}��A�:}�:’(��A�:’(�:’)��A�:’)�:’-(��A�:’-(�:’-)��A�:’-)�;)��A�;)�;-)��A�;-)�;-D��A�;-D�;D��A�;D�;_;��A�;_;�<.<��A�<.<�</3��A�</3�<3��A�<3�<33��A�<33�<333��A�<333�<space>��A�<space>�=(��A�=(�=)��A�=)�=/��A�=/�=3��A�=3�=D��A�=D�=[��A�=[�=]��A�=]�=|��A�=|�>.<��A�>.<�>.>��A�>.>�>:(��A�>:(�>:o��A�>:o�><(((*>��A�><(((*>�@_@��A�@_@�Art.��A�Art.�Avv.��A�Avv.�C++��A�C++�C.so��A�C.so�Civ.��A�Civ.�Cod.��A�Cod.�Cost.��A�Cost.�E'��A�E'�E’��A�E’�Jr.��A�Jr.�L'art.��A�L'�A�art.�L’art.��A�L’�A�art.�O.O��A�O.O�O.o��A�O.o�O_O��A�O_O�O_o��A�O_o�Proc.��A�Proc.�St.��A�St.�V.V��A�V.V�V_V��A�V_V�XD��A�XD�XDD��A�XDD�[-:��A�[-:�[:��A�[:�[=��A�[=�\")��A�\")�\n��A�\n�\t��A�\t�]=��A�]=�^_^��A�^_^�^__^��A�^__^�^___^��A�^___^�a.��A�a.�a.C.��A�a.C.�al.��A�al.�all'art.��A�all'�A�art.�all-path��A�all-path�all’art.��A�all’�A�art.�art.��A�art.�artt.��A�artt.�att.��A�att.�avv.��A�avv.�b.��A�b.�by-pass��A�by-pass�c.��A�c.�c.d.��A�c.d.�c/c��A�c/c�centro-sinistra��A�centro-sinistra�check-up��A�check-up�cm.��A�cm.�col.��A�col.�d.��A�d.�d.C.��A�d.C.�dall'art.��A�dall'�A�art.�dall’art.��A�dall’�A�art.�de"��A�de"�dell'art.��A�dell'�A�art.�dell’art.��A�dell’�A�art.�distr.��A�distr.�e-mail��A�e-mail�e.��A�e.�e/o��A�e/o�ecc.��A�ecc.�etc.��A�etc.�f.��A�f.�g.��A�g.�h.��A�h.�i.��A�i.�j.��A�j.�k.��A�k.�l'art.��A�l'�A�art.�l.��A�l.�l’art.��A�l’�A�art.�m.��A�m.�n.��A�n.�nell'art.��A�nell'�A�art.�nell’art.��A�nell’�A�art.�nord-est��A�nord-est�n°��A�n°�o.��A�o.�o.0��A�o.0�o.O��A�o.O�o.o��A�o.o�o_0��A�o_0�o_O��A�o_O�o_o��A�o_o�p.��A�p.�pag.��A�pag.�po'��A�po'�po’��A�po’�prof.��A�prof.�q.��A�q.�r.��A�r.�s.��A�s.�s.n.c��A�s.n.c�s.p.a.��A�s.p.a.�s.r.l��A�s.r.l�sett.��A�sett.�sett..��A�sett.�A�.�ss.��A�ss.�t.��A�t.�tel.��A�tel.�u.��A�u.�v.��A�v.�v.v��A�v.v�v_v��A�v_v�w.��A�w.�week-end��A�week-end�x.��A�x.�xD��A�xD�xDD��A�xDD�y.��A�y.�z.��A�z.� ��A� C� �¯\(ツ)/¯��A�¯\(ツ)/¯�°C.��A�°�A�C�A�.�°F.��A�°�A�F�A�.�°K.��A�°�A�K�A�.�°c.��A�°�A�c�A�.�°f.��A�°�A�f�A�.�°k.��A�°�A�k�A�.�ä.��A�ä.�ö.��A�ö.�ü.��A�ü.�ಠ_ಠ��A�ಠ_ಠ�ಠ︵ಠ��A�ಠ︵ಠ�—��A�—�’��A�’�’’��A�’’�faster_heuristics�
transformer/cfg ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "max_batch_items":4096
3
+ }
transformer/model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f23cadef2239affa1669e5ab1a4f91a2d1f1956991232a14145ed9b380df47e2
3
+ size 672942614
vocab/key2row ADDED
@@ -0,0 +1 @@
 
 
1
+
vocab/lookups.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76be8b528d0075f7aae98d6fa57a6d3c83ae480a8469e668d7b0af968995ac71
3
+ size 1
vocab/strings.json ADDED
@@ -0,0 +1,1493 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ "\t",
3
+ "\n",
4
+ "\r",
5
+ " ",
6
+ " ",
7
+ "\"",
8
+ "'",
9
+ "''",
10
+ "'-(",
11
+ "'-)",
12
+ "(",
13
+ "(((",
14
+ "(*>",
15
+ "(*_*)",
16
+ "(-8",
17
+ "(-:",
18
+ "(-;",
19
+ "(-_-)",
20
+ "(-d",
21
+ "(._.)",
22
+ "(:",
23
+ "(;",
24
+ "(=",
25
+ "(>_<)",
26
+ "(^_^)",
27
+ "(o:",
28
+ "(x:",
29
+ "(x_x)",
30
+ "(\u00ac_\u00ac)",
31
+ "(\u0ca0_\u0ca0)",
32
+ "(\u256f\u00b0\u25a1\u00b0\uff09\u256f\ufe35\u253b\u2501\u253b",
33
+ ")",
34
+ ")))",
35
+ ")-:",
36
+ ")/\u00af",
37
+ "):",
38
+ "*",
39
+ ",",
40
+ "-",
41
+ "-((",
42
+ "-))",
43
+ "-/",
44
+ "-0",
45
+ "-3",
46
+ "-8",
47
+ "-D",
48
+ "-O",
49
+ "-P",
50
+ "-X",
51
+ "-_-",
52
+ "-__-",
53
+ "-d",
54
+ "-o",
55
+ "-p",
56
+ "-up",
57
+ "-x",
58
+ "-|",
59
+ ".",
60
+ "..",
61
+ "...",
62
+ "....",
63
+ ".C.",
64
+ "._.",
65
+ ".a.",
66
+ ".d.",
67
+ ".so",
68
+ "/",
69
+ "/3",
70
+ "/d",
71
+ "0",
72
+ "0.0",
73
+ "0.o",
74
+ "0_0",
75
+ "0_o",
76
+ "1",
77
+ "3",
78
+ "33",
79
+ "333",
80
+ "8",
81
+ "8)",
82
+ "8-",
83
+ "8-)",
84
+ "8-D",
85
+ "8-d",
86
+ "8D",
87
+ "8d",
88
+ ":",
89
+ ":'(",
90
+ ":')",
91
+ ":'-(",
92
+ ":'-)",
93
+ ":(",
94
+ ":((",
95
+ ":(((",
96
+ ":()",
97
+ ":)",
98
+ ":))",
99
+ ":)))",
100
+ ":*",
101
+ ":-(",
102
+ ":-((",
103
+ ":-(((",
104
+ ":-)",
105
+ ":-))",
106
+ ":-)))",
107
+ ":-*",
108
+ ":-/",
109
+ ":-0",
110
+ ":-3",
111
+ ":->",
112
+ ":-D",
113
+ ":-O",
114
+ ":-P",
115
+ ":-X",
116
+ ":-]",
117
+ ":-d",
118
+ ":-o",
119
+ ":-p",
120
+ ":-x",
121
+ ":-|",
122
+ ":-}",
123
+ ":/",
124
+ ":0",
125
+ ":1",
126
+ ":3",
127
+ ":>",
128
+ ":D",
129
+ ":O",
130
+ ":P",
131
+ ":X",
132
+ ":]",
133
+ ":d",
134
+ ":o",
135
+ ":o)",
136
+ ":p",
137
+ ":x",
138
+ ":x)",
139
+ ":|",
140
+ ":}",
141
+ ":\u2019(",
142
+ ":\u2019)",
143
+ ":\u2019-(",
144
+ ":\u2019-)",
145
+ ";",
146
+ ";)",
147
+ ";-)",
148
+ ";-D",
149
+ ";-X",
150
+ ";-d",
151
+ ";D",
152
+ ";X",
153
+ ";_;",
154
+ ";d",
155
+ "<",
156
+ "<.<",
157
+ "</3",
158
+ "</d",
159
+ "<3",
160
+ "<33",
161
+ "<333",
162
+ "<d",
163
+ "<dd",
164
+ "<ddd",
165
+ "<space>",
166
+ "<xxxx>",
167
+ "=",
168
+ "=(",
169
+ "=)",
170
+ "=/",
171
+ "=3",
172
+ "=D",
173
+ "=X",
174
+ "=[",
175
+ "=]",
176
+ "=d",
177
+ "=|",
178
+ ">",
179
+ ">.<",
180
+ ">.>",
181
+ ">:(",
182
+ ">:o",
183
+ ">:x",
184
+ "><(((*>",
185
+ "@",
186
+ "@_@",
187
+ "A",
188
+ "AND",
189
+ "Abramo",
190
+ "Adone",
191
+ "Affonso",
192
+ "Agapito",
193
+ "Agata",
194
+ "Alba",
195
+ "Alberico",
196
+ "Alberta",
197
+ "Alberto",
198
+ "Aldo",
199
+ "Alexander",
200
+ "Alfaro",
201
+ "Alfeo",
202
+ "Alfonsi",
203
+ "Alfonso",
204
+ "Alla",
205
+ "Allesi",
206
+ "Altera",
207
+ "Alvise",
208
+ "Amando",
209
+ "Ambrogino",
210
+ "Ambrogio",
211
+ "Amore",
212
+ "Anacleto",
213
+ "Anastasio",
214
+ "Andreina",
215
+ "Angelico",
216
+ "Angelo",
217
+ "Angiolo",
218
+ "Arcuri",
219
+ "Armo",
220
+ "Arrigo",
221
+ "Arsenio",
222
+ "Art",
223
+ "Art.",
224
+ "Aurelio",
225
+ "Avv",
226
+ "Avv.",
227
+ "Azzurra",
228
+ "B",
229
+ "Balan",
230
+ "Baresi",
231
+ "Baroffio",
232
+ "Bellini",
233
+ "Bellucci",
234
+ "Beneventi",
235
+ "Bertoldo",
236
+ "Bethowen",
237
+ "Biagino",
238
+ "Bianchi",
239
+ "Big",
240
+ "Bonfilia",
241
+ "Borroni",
242
+ "Branson",
243
+ "Brichese",
244
+ "Bruno",
245
+ "Buccio",
246
+ "Buffon",
247
+ "Buratti",
248
+ "C",
249
+ "C++",
250
+ "C.",
251
+ "C.so",
252
+ "COMMAND",
253
+ "Cafaro",
254
+ "Cajetan",
255
+ "Calabresi",
256
+ "Campagna",
257
+ "Candreva",
258
+ "Cantu",
259
+ "Capone",
260
+ "Carlita",
261
+ "Carlota",
262
+ "Castiglione",
263
+ "Cecilio",
264
+ "Cedano",
265
+ "Celestina",
266
+ "Celso",
267
+ "Cesar",
268
+ "Chiara",
269
+ "Chiarina",
270
+ "Christian",
271
+ "Ciao",
272
+ "Ciccone",
273
+ "Cidano",
274
+ "Cittadino",
275
+ "Civ",
276
+ "Civ.",
277
+ "Clemente",
278
+ "Cleto",
279
+ "Cocci",
280
+ "Cociarelli",
281
+ "Cod",
282
+ "Cod.",
283
+ "Colombina",
284
+ "Colombo",
285
+ "Consoli",
286
+ "Conti",
287
+ "Cost",
288
+ "Cost.",
289
+ "Costantino",
290
+ "Crispino",
291
+ "Cristiano",
292
+ "Cristoforo",
293
+ "D",
294
+ "D'",
295
+ "Damiano",
296
+ "Dan",
297
+ "Daniele",
298
+ "Dario",
299
+ "Davide",
300
+ "De",
301
+ "Demi",
302
+ "Desideria",
303
+ "Desiderio",
304
+ "Detti",
305
+ "Di",
306
+ "Dino",
307
+ "Doe",
308
+ "Dona",
309
+ "Donatella",
310
+ "Donati",
311
+ "Donato",
312
+ "Donini",
313
+ "Dorotea",
314
+ "Duca",
315
+ "Durante",
316
+ "E",
317
+ "E'",
318
+ "Edmonda",
319
+ "Elario",
320
+ "Elena",
321
+ "Eligio",
322
+ "Elma",
323
+ "Elmo",
324
+ "Emiliano",
325
+ "Endrizzi",
326
+ "Eneide",
327
+ "Enrichetta",
328
+ "Ermete",
329
+ "Erminio",
330
+ "Esparza",
331
+ "Ezzelin",
332
+ "E\u2019",
333
+ "F",
334
+ "F.",
335
+ "Fabio",
336
+ "Fanucci",
337
+ "Fausto",
338
+ "Felice",
339
+ "Fel\u00eccita",
340
+ "Ferrari",
341
+ "Ferruccio",
342
+ "Fiammetta",
343
+ "Filberto",
344
+ "Filomena",
345
+ "Fiorella",
346
+ "Fiorentini",
347
+ "Fiorentino",
348
+ "Fiorenzo",
349
+ "Florentina",
350
+ "Fontana",
351
+ "Fortunata",
352
+ "Franca",
353
+ "Franco",
354
+ "Fulvia",
355
+ "Fulvio",
356
+ "G",
357
+ "Gabriella",
358
+ "Gallo",
359
+ "Garcia",
360
+ "Gelli",
361
+ "Gemma",
362
+ "Genera",
363
+ "General",
364
+ "Generale",
365
+ "Gennaro",
366
+ "Genoveffa",
367
+ "Genovese",
368
+ "Genovesi",
369
+ "Gentilini",
370
+ "Gerardo",
371
+ "Giacomo",
372
+ "Gianni",
373
+ "Ginevra",
374
+ "Gino",
375
+ "Gioconda",
376
+ "Giordano",
377
+ "Giorgina",
378
+ "Giovanna",
379
+ "Giovinco",
380
+ "Giulia",
381
+ "Giustina",
382
+ "Giustino",
383
+ "Goffredo",
384
+ "Golino",
385
+ "Great",
386
+ "Greco",
387
+ "Greece",
388
+ "Gregario",
389
+ "Gucci",
390
+ "H",
391
+ "Hailey",
392
+ "I",
393
+ "IOA",
394
+ "Iadanza",
395
+ "Ignazio",
396
+ "Ilaria",
397
+ "Imelda",
398
+ "Immacolata",
399
+ "In",
400
+ "Ingegnere",
401
+ "Ingegner\u00e0",
402
+ "Insigne",
403
+ "Invia",
404
+ "J",
405
+ "Jacopo",
406
+ "Jemma",
407
+ "John",
408
+ "Jolanda",
409
+ "Jr",
410
+ "Jr.",
411
+ "K",
412
+ "K.",
413
+ "L",
414
+ "L'",
415
+ "L'art.",
416
+ "Lalia",
417
+ "Leonzio",
418
+ "Letizia",
419
+ "Lettiere",
420
+ "Lia",
421
+ "Livio",
422
+ "Lo",
423
+ "Locatello",
424
+ "Loggia",
425
+ "Lombardi",
426
+ "Longo",
427
+ "Lorenzo",
428
+ "Loreto",
429
+ "Lori",
430
+ "Lothario",
431
+ "Luca",
432
+ "Lucchesi",
433
+ "Lucciano",
434
+ "Ludovica",
435
+ "Ludovico",
436
+ "Luig",
437
+ "Luigina",
438
+ "L\u2019",
439
+ "L\u2019art.",
440
+ "M",
441
+ "Madeleine",
442
+ "Malvolia",
443
+ "Mancini",
444
+ "Manlio",
445
+ "Manna",
446
+ "Marcello",
447
+ "Marco",
448
+ "Mariella",
449
+ "Marietta",
450
+ "Marino",
451
+ "Marotta",
452
+ "Marta",
453
+ "Marzio",
454
+ "Mazzi",
455
+ "Melania",
456
+ "Melchiorre",
457
+ "Meo",
458
+ "Mike",
459
+ "Milano",
460
+ "Mirella",
461
+ "Modesto",
462
+ "Mona",
463
+ "Moretti",
464
+ "Moze",
465
+ "N",
466
+ "Napolitani",
467
+ "Natanaele",
468
+ "Necci",
469
+ "Neri",
470
+ "Nicola",
471
+ "Nicol\u00f2",
472
+ "Nino",
473
+ "Noelia",
474
+ "Noemi",
475
+ "O",
476
+ "O.O",
477
+ "O.o",
478
+ "O_O",
479
+ "O_o",
480
+ "Offredi",
481
+ "Onio",
482
+ "Orabella",
483
+ "Orsina",
484
+ "Oscuro",
485
+ "Ossani",
486
+ "Ottaviano",
487
+ "Ottavio",
488
+ "P",
489
+ "Paccioretti",
490
+ "Pagnotto",
491
+ "Palazzo",
492
+ "Palerma",
493
+ "Palermo",
494
+ "Panicucci",
495
+ "Paolina",
496
+ "Passero",
497
+ "Paul",
498
+ "Per",
499
+ "Piazza",
500
+ "Piccio",
501
+ "Piera",
502
+ "Piero",
503
+ "Pirozzi",
504
+ "Pisano",
505
+ "Porto",
506
+ "Proc",
507
+ "Proc.",
508
+ "Prospero",
509
+ "R",
510
+ "ROOT",
511
+ "Raniero",
512
+ "Report",
513
+ "Riccardo",
514
+ "Ricci",
515
+ "Rinaldo",
516
+ "Rivera",
517
+ "Romani",
518
+ "Romano",
519
+ "Romhilda",
520
+ "Rosannah",
521
+ "Rose",
522
+ "Rosiello",
523
+ "Rosina",
524
+ "Rossi",
525
+ "Rua",
526
+ "Russo",
527
+ "S",
528
+ "SON",
529
+ "Sabbatini",
530
+ "Sal",
531
+ "Salve",
532
+ "Samuele",
533
+ "Santa",
534
+ "Scarica",
535
+ "Serafina",
536
+ "Serafino",
537
+ "Sesto",
538
+ "Settimio",
539
+ "Severiano",
540
+ "Shepherd",
541
+ "Siciliano",
542
+ "Silvana",
543
+ "Small",
544
+ "Spours",
545
+ "St",
546
+ "St.",
547
+ "Stefania",
548
+ "Stephen",
549
+ "Strinati",
550
+ "T",
551
+ "Teodosio",
552
+ "Terenzio",
553
+ "Terzo",
554
+ "The",
555
+ "Thornton",
556
+ "Tino",
557
+ "To",
558
+ "Tocci",
559
+ "Tonia",
560
+ "Toscani",
561
+ "Trentini",
562
+ "U",
563
+ "Udinese",
564
+ "Udinesi",
565
+ "Umberto",
566
+ "Un",
567
+ "Underwoodn",
568
+ "V",
569
+ "V.V",
570
+ "V_V",
571
+ "Valeriano",
572
+ "Van",
573
+ "Vanna",
574
+ "Vecellio",
575
+ "Vecoli",
576
+ "Venceslao",
577
+ "Venturi",
578
+ "Verratti",
579
+ "Via",
580
+ "Vicenzo",
581
+ "Vinicio",
582
+ "Violante",
583
+ "Violetta",
584
+ "Virgilio",
585
+ "Vittoria",
586
+ "Voleo",
587
+ "Volta",
588
+ "X'",
589
+ "X'xxx.",
590
+ "X++",
591
+ "X.",
592
+ "X.X",
593
+ "X.x",
594
+ "X.xx",
595
+ "XD",
596
+ "XDD",
597
+ "XX",
598
+ "XXX",
599
+ "XXXX",
600
+ "X_X",
601
+ "X_x",
602
+ "Xx",
603
+ "Xx.",
604
+ "Xxx",
605
+ "Xxx.",
606
+ "Xxxx",
607
+ "Xxxx.",
608
+ "Xxxxx",
609
+ "X\u2019",
610
+ "X\u2019xxx.",
611
+ "Z",
612
+ "Zetticci",
613
+ "Zita",
614
+ "Zito",
615
+ "[",
616
+ "[-:",
617
+ "[:",
618
+ "[=",
619
+ "\\",
620
+ "\\\")",
621
+ "\\n",
622
+ "\\t",
623
+ "\\x",
624
+ "]",
625
+ "]=",
626
+ "^",
627
+ "^_^",
628
+ "^__^",
629
+ "^___^",
630
+ "_*)",
631
+ "_-)",
632
+ "_.)",
633
+ "_<)",
634
+ "_^)",
635
+ "__-",
636
+ "__^",
637
+ "_\u00ac)",
638
+ "_\u0ca0)",
639
+ "a",
640
+ "a.",
641
+ "a.C.",
642
+ "a.c.",
643
+ "abramo",
644
+ "ace",
645
+ "adone",
646
+ "adriana",
647
+ "affonso",
648
+ "ag.",
649
+ "agapito",
650
+ "agata",
651
+ "ail",
652
+ "al",
653
+ "al.",
654
+ "alba",
655
+ "albano",
656
+ "alberico",
657
+ "alberta",
658
+ "alberto",
659
+ "aldo",
660
+ "ale",
661
+ "alexander",
662
+ "alfaro",
663
+ "alfeo",
664
+ "alfonsi",
665
+ "alfonso",
666
+ "all",
667
+ "all'",
668
+ "all'art.",
669
+ "all-path",
670
+ "alla",
671
+ "allesi",
672
+ "all\u2019",
673
+ "all\u2019art.",
674
+ "altera",
675
+ "alvise",
676
+ "amando",
677
+ "ambrogino",
678
+ "ambrogio",
679
+ "amigo",
680
+ "amo",
681
+ "amore",
682
+ "ana",
683
+ "anacleto",
684
+ "anastasio",
685
+ "andreina",
686
+ "angelico",
687
+ "angelo",
688
+ "angiolo",
689
+ "ani",
690
+ "anjelica",
691
+ "ano",
692
+ "ara",
693
+ "arcuri",
694
+ "are",
695
+ "ari",
696
+ "armo",
697
+ "aro",
698
+ "arrigo",
699
+ "arsenio",
700
+ "art",
701
+ "art.",
702
+ "artt",
703
+ "artt.",
704
+ "ass",
705
+ "ata",
706
+ "ath",
707
+ "ati",
708
+ "ato",
709
+ "att",
710
+ "att.",
711
+ "aul",
712
+ "aurelio",
713
+ "avv",
714
+ "avv.",
715
+ "azzurra",
716
+ "b",
717
+ "b.",
718
+ "balan",
719
+ "baresi",
720
+ "baroffio",
721
+ "bella",
722
+ "bellini",
723
+ "bellucci",
724
+ "beneventi",
725
+ "bertoldo",
726
+ "bethowen",
727
+ "biagino",
728
+ "biagio",
729
+ "bianchi",
730
+ "big",
731
+ "bio",
732
+ "bonfilia",
733
+ "borroni",
734
+ "bot",
735
+ "branson",
736
+ "brichese",
737
+ "bruno",
738
+ "buccio",
739
+ "buffon",
740
+ "buongiorno",
741
+ "buratti",
742
+ "by",
743
+ "by-pass",
744
+ "c",
745
+ "c++",
746
+ "c.",
747
+ "c.d",
748
+ "c.d.",
749
+ "c.so",
750
+ "c/c",
751
+ "cIOA",
752
+ "cafaro",
753
+ "cajetan",
754
+ "calabresi",
755
+ "campagna",
756
+ "candreva",
757
+ "cantu",
758
+ "capone",
759
+ "carlita",
760
+ "carlota",
761
+ "caro",
762
+ "castiglione",
763
+ "cc.",
764
+ "cci",
765
+ "ce>",
766
+ "cecilio",
767
+ "cedano",
768
+ "celestina",
769
+ "celso",
770
+ "centro",
771
+ "centro-sinistra",
772
+ "cesar",
773
+ "check",
774
+ "check-up",
775
+ "chi",
776
+ "chiara",
777
+ "chiarina",
778
+ "christian",
779
+ "cia",
780
+ "ciao",
781
+ "ciccone",
782
+ "cidano",
783
+ "cio",
784
+ "cioa",
785
+ "cittadino",
786
+ "civ",
787
+ "civ.",
788
+ "clemente",
789
+ "cleto",
790
+ "cm",
791
+ "cm.",
792
+ "cocci",
793
+ "cociarelli",
794
+ "cod",
795
+ "cod.",
796
+ "col",
797
+ "col.",
798
+ "colombina",
799
+ "colombo",
800
+ "command",
801
+ "consoli",
802
+ "conti",
803
+ "cost",
804
+ "cost.",
805
+ "costantino",
806
+ "crispino",
807
+ "cristiano",
808
+ "cristoforo",
809
+ "crocetta",
810
+ "d",
811
+ "d'",
812
+ "d)",
813
+ "d-",
814
+ "d-)",
815
+ "d-X",
816
+ "d.",
817
+ "d.C.",
818
+ "d.c.",
819
+ "d.d",
820
+ "d.x",
821
+ "dX",
822
+ "d_d",
823
+ "d_x",
824
+ "dall'",
825
+ "dall'art.",
826
+ "dall\u2019",
827
+ "dall\u2019art.",
828
+ "damiano",
829
+ "dan",
830
+ "daniele",
831
+ "dario",
832
+ "davide",
833
+ "dd",
834
+ "ddd",
835
+ "de",
836
+ "de\"",
837
+ "del",
838
+ "dell'",
839
+ "dell'art.",
840
+ "dell\u2019",
841
+ "dell\u2019art.",
842
+ "demi",
843
+ "der",
844
+ "desideria",
845
+ "desiderio",
846
+ "detti",
847
+ "di",
848
+ "dino",
849
+ "dio",
850
+ "distr",
851
+ "distr.",
852
+ "doe",
853
+ "dona",
854
+ "donata",
855
+ "donatella",
856
+ "donati",
857
+ "donato",
858
+ "donini",
859
+ "dorotea",
860
+ "duca",
861
+ "dude",
862
+ "durante",
863
+ "e",
864
+ "e'",
865
+ "e-mail",
866
+ "e.",
867
+ "e/o",
868
+ "eat",
869
+ "ecc",
870
+ "ecc.",
871
+ "ece",
872
+ "eck",
873
+ "eco",
874
+ "edi",
875
+ "edmonda",
876
+ "edo",
877
+ "eek",
878
+ "el.",
879
+ "elario",
880
+ "ele",
881
+ "elena",
882
+ "elia",
883
+ "eligio",
884
+ "elma",
885
+ "elmo",
886
+ "elo",
887
+ "elpidio",
888
+ "email",
889
+ "emaill",
890
+ "emi",
891
+ "emiliano",
892
+ "ena",
893
+ "end",
894
+ "endrizzi",
895
+ "eneide",
896
+ "enrichetta",
897
+ "era",
898
+ "erd",
899
+ "ere",
900
+ "eri",
901
+ "ermete",
902
+ "erminio",
903
+ "ero",
904
+ "er\u00e0",
905
+ "ese",
906
+ "esi",
907
+ "esparza",
908
+ "esposito",
909
+ "est",
910
+ "etc",
911
+ "etc.",
912
+ "ete",
913
+ "eto",
914
+ "ett",
915
+ "eva",
916
+ "ezzelin",
917
+ "e\u2019",
918
+ "f",
919
+ "f.",
920
+ "fabio",
921
+ "fabrizio",
922
+ "fanucci",
923
+ "fausto",
924
+ "favore",
925
+ "fazio",
926
+ "felice",
927
+ "fel\u00eccita",
928
+ "feo",
929
+ "ferrari",
930
+ "ferruccio",
931
+ "ffa",
932
+ "fiammetta",
933
+ "filberto",
934
+ "filomena",
935
+ "fio",
936
+ "fiorella",
937
+ "fiorentini",
938
+ "fiorentino",
939
+ "fiorenza",
940
+ "fiorenzo",
941
+ "florentina",
942
+ "folliero",
943
+ "fon",
944
+ "fontana",
945
+ "fortunata",
946
+ "franca",
947
+ "franco",
948
+ "fulvia",
949
+ "fulvio",
950
+ "g",
951
+ "g.",
952
+ "gabriella",
953
+ "gallo",
954
+ "garcia",
955
+ "gelli",
956
+ "gemma",
957
+ "genera",
958
+ "general",
959
+ "generale",
960
+ "generare",
961
+ "gennaro",
962
+ "genoveffa",
963
+ "genovese",
964
+ "genovesi",
965
+ "gentilini",
966
+ "gerardo",
967
+ "gia",
968
+ "giacomo",
969
+ "gianni",
970
+ "ginevra",
971
+ "gino",
972
+ "gio",
973
+ "gioconda",
974
+ "giordano",
975
+ "giorgina",
976
+ "giovanna",
977
+ "giovinco",
978
+ "girolamo",
979
+ "giulia",
980
+ "giustina",
981
+ "giustino",
982
+ "gna",
983
+ "gne",
984
+ "goffredo",
985
+ "golino",
986
+ "great",
987
+ "greco",
988
+ "greece",
989
+ "gregario",
990
+ "gucci",
991
+ "h",
992
+ "h.",
993
+ "hailey",
994
+ "hen",
995
+ "i",
996
+ "i.",
997
+ "iadanza",
998
+ "ian",
999
+ "iao",
1000
+ "ica",
1001
+ "ice",
1002
+ "ico",
1003
+ "ide",
1004
+ "ignazio",
1005
+ "igo",
1006
+ "ike",
1007
+ "il",
1008
+ "ilaria",
1009
+ "ill",
1010
+ "imelda",
1011
+ "immacolata",
1012
+ "in",
1013
+ "ina",
1014
+ "ine",
1015
+ "ingegnere",
1016
+ "ingegner\u00e0",
1017
+ "ini",
1018
+ "innocenzo",
1019
+ "ino",
1020
+ "insigne",
1021
+ "invia",
1022
+ "ioa",
1023
+ "ise",
1024
+ "it",
1025
+ "ita",
1026
+ "ito",
1027
+ "iv.",
1028
+ "j",
1029
+ "j.",
1030
+ "jacopo",
1031
+ "jemma",
1032
+ "jilani",
1033
+ "john",
1034
+ "jolanda",
1035
+ "jr",
1036
+ "jr.",
1037
+ "k",
1038
+ "k.",
1039
+ "l",
1040
+ "l'",
1041
+ "l'art.",
1042
+ "l.",
1043
+ "lalia",
1044
+ "lan",
1045
+ "lao",
1046
+ "lauro",
1047
+ "lba",
1048
+ "lda",
1049
+ "ldo",
1050
+ "leo",
1051
+ "leonzio",
1052
+ "letizia",
1053
+ "lettiere",
1054
+ "ley",
1055
+ "lia",
1056
+ "lin",
1057
+ "lio",
1058
+ "livio",
1059
+ "ll'",
1060
+ "lla",
1061
+ "lli",
1062
+ "llo",
1063
+ "ll\u2019",
1064
+ "lma",
1065
+ "lmo",
1066
+ "lo",
1067
+ "locatello",
1068
+ "loggia",
1069
+ "lombardi",
1070
+ "longo",
1071
+ "lorenzo",
1072
+ "loreto",
1073
+ "lori",
1074
+ "lothario",
1075
+ "lso",
1076
+ "lta",
1077
+ "luca",
1078
+ "lucchesi",
1079
+ "lucciano",
1080
+ "ludovica",
1081
+ "ludovico",
1082
+ "luig",
1083
+ "luigina",
1084
+ "lve",
1085
+ "l\u2019",
1086
+ "l\u2019art.",
1087
+ "m",
1088
+ "m.",
1089
+ "madeleine",
1090
+ "mail",
1091
+ "malvolia",
1092
+ "mancini",
1093
+ "manlio",
1094
+ "manna",
1095
+ "marcello",
1096
+ "marco",
1097
+ "mariella",
1098
+ "marietta",
1099
+ "marino",
1100
+ "marotta",
1101
+ "marta",
1102
+ "marzio",
1103
+ "mazzi",
1104
+ "mbo",
1105
+ "melania",
1106
+ "melchiorre",
1107
+ "meo",
1108
+ "mike",
1109
+ "milano",
1110
+ "mio",
1111
+ "mirella",
1112
+ "mma",
1113
+ "modesto",
1114
+ "mona",
1115
+ "moretti",
1116
+ "moze",
1117
+ "n",
1118
+ "n.",
1119
+ "n.c",
1120
+ "nah",
1121
+ "napolitani",
1122
+ "natanaele",
1123
+ "nca",
1124
+ "nco",
1125
+ "nda",
1126
+ "ndo",
1127
+ "necci",
1128
+ "nell'",
1129
+ "nell'art.",
1130
+ "nell\u2019",
1131
+ "nell\u2019art.",
1132
+ "neri",
1133
+ "ngo",
1134
+ "nia",
1135
+ "nicola",
1136
+ "nicol\u00f2",
1137
+ "nicomedo",
1138
+ "nino",
1139
+ "nio",
1140
+ "nna",
1141
+ "nni",
1142
+ "noelia",
1143
+ "noemi",
1144
+ "nord",
1145
+ "nord-est",
1146
+ "nsi",
1147
+ "nso",
1148
+ "nta",
1149
+ "nte",
1150
+ "nti",
1151
+ "nto",
1152
+ "ntu",
1153
+ "nza",
1154
+ "nzo",
1155
+ "n\u00b0",
1156
+ "o",
1157
+ "o.",
1158
+ "o.0",
1159
+ "o.O",
1160
+ "o.o",
1161
+ "o_0",
1162
+ "o_O",
1163
+ "o_o",
1164
+ "oc.",
1165
+ "od.",
1166
+ "odn",
1167
+ "of.",
1168
+ "offredi",
1169
+ "ohn",
1170
+ "ol.",
1171
+ "ola",
1172
+ "oli",
1173
+ "olo",
1174
+ "ol\u00f2",
1175
+ "omo",
1176
+ "ona",
1177
+ "one",
1178
+ "oni",
1179
+ "onio",
1180
+ "opo",
1181
+ "orabella",
1182
+ "ord",
1183
+ "ore",
1184
+ "ori",
1185
+ "oro",
1186
+ "orsina",
1187
+ "ort",
1188
+ "oscuro",
1189
+ "ose",
1190
+ "ossani",
1191
+ "ost",
1192
+ "ota",
1193
+ "ottaviano",
1194
+ "ottavio",
1195
+ "oze",
1196
+ "p",
1197
+ "p.",
1198
+ "p.a",
1199
+ "paccioretti",
1200
+ "pag",
1201
+ "pag.",
1202
+ "pagnotto",
1203
+ "palazzo",
1204
+ "palerma",
1205
+ "palermo",
1206
+ "panicucci",
1207
+ "paolina",
1208
+ "pass",
1209
+ "passero",
1210
+ "path",
1211
+ "paul",
1212
+ "per",
1213
+ "person",
1214
+ "persona",
1215
+ "piazza",
1216
+ "piccio",
1217
+ "piera",
1218
+ "piero",
1219
+ "pietronella",
1220
+ "pino",
1221
+ "pinto",
1222
+ "pirozzi",
1223
+ "pisano",
1224
+ "po",
1225
+ "po'",
1226
+ "port",
1227
+ "porte",
1228
+ "porto",
1229
+ "po\u2019",
1230
+ "proc",
1231
+ "proc.",
1232
+ "prof",
1233
+ "prof.",
1234
+ "prospero",
1235
+ "q",
1236
+ "q.",
1237
+ "r",
1238
+ "r.",
1239
+ "r.l",
1240
+ "ral",
1241
+ "raniero",
1242
+ "rco",
1243
+ "rdi",
1244
+ "rdo",
1245
+ "report",
1246
+ "ria",
1247
+ "riccardo",
1248
+ "ricci",
1249
+ "rinaldo",
1250
+ "rio",
1251
+ "riporto",
1252
+ "rivera",
1253
+ "rma",
1254
+ "rmo",
1255
+ "rno",
1256
+ "robot",
1257
+ "roc",
1258
+ "rof",
1259
+ "romani",
1260
+ "romano",
1261
+ "romhilda",
1262
+ "rosannah",
1263
+ "rose",
1264
+ "rosiello",
1265
+ "rosina",
1266
+ "rossi",
1267
+ "rra",
1268
+ "rre",
1269
+ "rt.",
1270
+ "rta",
1271
+ "rte",
1272
+ "rto",
1273
+ "rtt",
1274
+ "rua",
1275
+ "russo",
1276
+ "rza",
1277
+ "rzo",
1278
+ "s",
1279
+ "s.",
1280
+ "s.n.c",
1281
+ "s.p.a",
1282
+ "s.p.a.",
1283
+ "s.r.l",
1284
+ "sabbatini",
1285
+ "sal",
1286
+ "salve",
1287
+ "samuele",
1288
+ "santa",
1289
+ "sar",
1290
+ "scarica",
1291
+ "scaricare",
1292
+ "serafina",
1293
+ "serafino",
1294
+ "sesto",
1295
+ "sett",
1296
+ "sett.",
1297
+ "sett..",
1298
+ "settimio",
1299
+ "severiano",
1300
+ "shepherd",
1301
+ "siciliano",
1302
+ "silvana",
1303
+ "sinistra",
1304
+ "sio",
1305
+ "small",
1306
+ "son",
1307
+ "space",
1308
+ "spours",
1309
+ "ss",
1310
+ "ss.",
1311
+ "ssi",
1312
+ "sso",
1313
+ "st",
1314
+ "st.",
1315
+ "stefania",
1316
+ "stephen",
1317
+ "sto",
1318
+ "str",
1319
+ "strinati",
1320
+ "t",
1321
+ "t.",
1322
+ "t..",
1323
+ "tan",
1324
+ "tc.",
1325
+ "tea",
1326
+ "tel",
1327
+ "tel.",
1328
+ "teodosio",
1329
+ "terenzio",
1330
+ "terzo",
1331
+ "the",
1332
+ "thornton",
1333
+ "tino",
1334
+ "to",
1335
+ "tocci",
1336
+ "ton",
1337
+ "tonia",
1338
+ "toscani",
1339
+ "tr.",
1340
+ "tra",
1341
+ "trentini",
1342
+ "tro",
1343
+ "tt.",
1344
+ "tta",
1345
+ "tti",
1346
+ "tto",
1347
+ "u",
1348
+ "u.",
1349
+ "uca",
1350
+ "ude",
1351
+ "udinese",
1352
+ "udinesi",
1353
+ "uig",
1354
+ "umberto",
1355
+ "un",
1356
+ "una",
1357
+ "underwoodn",
1358
+ "uno",
1359
+ "up",
1360
+ "uri",
1361
+ "uro",
1362
+ "urs",
1363
+ "utente",
1364
+ "v",
1365
+ "v.",
1366
+ "v.v",
1367
+ "v_v",
1368
+ "valeriano",
1369
+ "van",
1370
+ "vanna",
1371
+ "vecellio",
1372
+ "vecoli",
1373
+ "venceslao",
1374
+ "venturi",
1375
+ "verratti",
1376
+ "via",
1377
+ "vicenzo",
1378
+ "vinicio",
1379
+ "vio",
1380
+ "violante",
1381
+ "violetta",
1382
+ "virgilio",
1383
+ "vittoria",
1384
+ "voleo",
1385
+ "volta",
1386
+ "vra",
1387
+ "vv.",
1388
+ "w",
1389
+ "w.",
1390
+ "week",
1391
+ "week-end",
1392
+ "wen",
1393
+ "x",
1394
+ "x'",
1395
+ "x'xxx.",
1396
+ "x-xxxx",
1397
+ "x.",
1398
+ "x.X",
1399
+ "x.X.",
1400
+ "x.d",
1401
+ "x.x",
1402
+ "x.x.",
1403
+ "x.x.x",
1404
+ "x.x.x.",
1405
+ "x/x",
1406
+ "xD",
1407
+ "xDD",
1408
+ "xX",
1409
+ "xXX",
1410
+ "xXXX",
1411
+ "x_X",
1412
+ "x_d",
1413
+ "x_x",
1414
+ "xd",
1415
+ "xdd",
1416
+ "xx",
1417
+ "xx\"",
1418
+ "xx'",
1419
+ "xx-xxxx",
1420
+ "xx.",
1421
+ "xxx",
1422
+ "xxx'",
1423
+ "xxx'xxx.",
1424
+ "xxx-xxxx",
1425
+ "xxx.",
1426
+ "xxxx",
1427
+ "xxxx'",
1428
+ "xxxx'xxx.",
1429
+ "xxxx-xx",
1430
+ "xxxx-xxx",
1431
+ "xxxx-xxxx",
1432
+ "xxxx.",
1433
+ "xxxx..",
1434
+ "xxxx\u2019",
1435
+ "xxxx\u2019xxx.",
1436
+ "xxx\u2019",
1437
+ "xxx\u2019xxx.",
1438
+ "xx\u2019",
1439
+ "x\u00b0",
1440
+ "x\u2019",
1441
+ "x\u2019xxx.",
1442
+ "x\ufe35x",
1443
+ "y",
1444
+ "y.",
1445
+ "z",
1446
+ "z.",
1447
+ "zetticci",
1448
+ "zia",
1449
+ "zio",
1450
+ "zita",
1451
+ "zito",
1452
+ "zza",
1453
+ "zzi",
1454
+ "zzo",
1455
+ "|",
1456
+ "}",
1457
+ "\u00a0",
1458
+ "\u00ac",
1459
+ "\u00ac_\u00ac",
1460
+ "\u00af",
1461
+ "\u00af\\(x)/\u00af",
1462
+ "\u00af\\(\u30c4)/\u00af",
1463
+ "\u00b0",
1464
+ "\u00b0C.",
1465
+ "\u00b0F.",
1466
+ "\u00b0K.",
1467
+ "\u00b0X.",
1468
+ "\u00b0c.",
1469
+ "\u00b0f.",
1470
+ "\u00b0k.",
1471
+ "\u00b0x.",
1472
+ "\u00e4",
1473
+ "\u00e4.",
1474
+ "\u00f6",
1475
+ "\u00f6.",
1476
+ "\u00fc",
1477
+ "\u00fc.",
1478
+ "\u0ca0",
1479
+ "\u0ca0_\u0ca0",
1480
+ "\u0ca0\ufe35\u0ca0",
1481
+ "\u2014",
1482
+ "\u2019",
1483
+ "\u2019-(",
1484
+ "\u2019-)",
1485
+ "\u2019\u2019",
1486
+ "\u2501",
1487
+ "\u253b",
1488
+ "\u253b\u2501\u253b",
1489
+ "\u256f",
1490
+ "\u25a1",
1491
+ "\ufe35",
1492
+ "\uff09"
1493
+ ]
vocab/vectors ADDED
Binary file (128 Bytes). View file
 
vocab/vectors.cfg ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "mode":"default"
3
+ }