Python committed on
Commit
1ca4f66
1 Parent(s): 6317be9

Upload 5 files

Browse files
config.json ADDED
@@ -0,0 +1,244 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Python/ACROSS-m2o-eng-small",
3
+ "architectures": [
4
+ "MT5ForConditionalGeneration"
5
+ ],
6
+ "consistency_loss_weight": 2.0,
7
+ "consistency_temperature": 1.0,
8
+ "contrastive": true,
9
+ "contrastive_mini_batch_size": 4,
10
+ "cross_alignment_loss_weight": 1.0,
11
+ "d_ff": 1024,
12
+ "d_kv": 64,
13
+ "d_model": 512,
14
+ "decoder_start_token_id": 0,
15
+ "dropout_rate": 0.1,
16
+ "eos_token_id": 1,
17
+ "feature_pooling_method": "mean_pooling",
18
+ "feed_forward_proj": "gated-gelu",
19
+ "freeze_decoder": false,
20
+ "freeze_mono_encoder": true,
21
+ "initializer_factor": 1.0,
22
+ "is_encoder_decoder": true,
23
+ "layer_norm_epsilon": 1e-06,
24
+ "length_penalty": 0.6,
25
+ "max_length": 84,
26
+ "model_type": "mt5",
27
+ "num_beams": 4,
28
+ "num_decoder_layers": 8,
29
+ "num_heads": 6,
30
+ "num_layers": 8,
31
+ "pad_token_id": 0,
32
+ "queue_size": 8192,
33
+ "relative_attention_num_buckets": 32,
34
+ "similarity_method": "cosine",
35
+ "t5_path_or_url": "output/eng2eng_small_baseline_A5000",
36
+ "task_specific_params": {
37
+ "langid_map": {
38
+ "amharic": [
39
+ 39,
40
+ "\u2581<extra_id_64>"
41
+ ],
42
+ "arabic": [
43
+ 8,
44
+ "\u2581<extra_id_95>"
45
+ ],
46
+ "azerbaijani": [
47
+ 11,
48
+ "\u2581<extra_id_92>"
49
+ ],
50
+ "bengali": [
51
+ 46,
52
+ "\u2581<extra_id_57>"
53
+ ],
54
+ "burmese": [
55
+ 37,
56
+ "\u2581<extra_id_66>"
57
+ ],
58
+ "chinese_simplified": [
59
+ 44,
60
+ "\u2581<extra_id_59>"
61
+ ],
62
+ "chinese_traditional": [
63
+ 48,
64
+ "\u2581<extra_id_55>"
65
+ ],
66
+ "czech": [
67
+ 3,
68
+ "\u2581<extra_id_54>"
69
+ ],
70
+ "dutch": [
71
+ 1,
72
+ "\u2581<extra_id_52>"
73
+ ],
74
+ "english": [
75
+ 34,
76
+ "\u2581<extra_id_69>"
77
+ ],
78
+ "french": [
79
+ 14,
80
+ "\u2581<extra_id_89>"
81
+ ],
82
+ "german": [
83
+ 0,
84
+ "\u2581<extra_id_51>"
85
+ ],
86
+ "gujarati": [
87
+ 31,
88
+ "\u2581<extra_id_72>"
89
+ ],
90
+ "hausa": [
91
+ 47,
92
+ "\u2581<extra_id_56>"
93
+ ],
94
+ "hindi": [
95
+ 25,
96
+ "\u2581<extra_id_78>"
97
+ ],
98
+ "igbo": [
99
+ 13,
100
+ "\u2581<extra_id_90>"
101
+ ],
102
+ "indonesian": [
103
+ 5,
104
+ "\u2581<extra_id_98>"
105
+ ],
106
+ "italian": [
107
+ 2,
108
+ "\u2581<extra_id_53>"
109
+ ],
110
+ "japanese": [
111
+ 41,
112
+ "\u2581<extra_id_62>"
113
+ ],
114
+ "kirundi": [
115
+ 4,
116
+ "\u2581<extra_id_99>"
117
+ ],
118
+ "korean": [
119
+ 33,
120
+ "\u2581<extra_id_70>"
121
+ ],
122
+ "kyrgyz": [
123
+ 9,
124
+ "\u2581<extra_id_94>"
125
+ ],
126
+ "marathi": [
127
+ 17,
128
+ "\u2581<extra_id_86>"
129
+ ],
130
+ "nepali": [
131
+ 24,
132
+ "\u2581<extra_id_79>"
133
+ ],
134
+ "oromo": [
135
+ 45,
136
+ "\u2581<extra_id_58>"
137
+ ],
138
+ "pashto": [
139
+ 38,
140
+ "\u2581<extra_id_65>"
141
+ ],
142
+ "persian": [
143
+ 27,
144
+ "\u2581<extra_id_76>"
145
+ ],
146
+ "pidgin": [
147
+ 18,
148
+ "\u2581<extra_id_85>"
149
+ ],
150
+ "portuguese": [
151
+ 43,
152
+ "\u2581<extra_id_60>"
153
+ ],
154
+ "punjabi": [
155
+ 21,
156
+ "\u2581<extra_id_82>"
157
+ ],
158
+ "russian": [
159
+ 40,
160
+ "\u2581<extra_id_63>"
161
+ ],
162
+ "scottish_gaelic": [
163
+ 28,
164
+ "\u2581<extra_id_75>"
165
+ ],
166
+ "serbian_cyrillic": [
167
+ 32,
168
+ "\u2581<extra_id_71>"
169
+ ],
170
+ "serbian_latin": [
171
+ 15,
172
+ "\u2581<extra_id_88>"
173
+ ],
174
+ "sinhala": [
175
+ 35,
176
+ "\u2581<extra_id_68>"
177
+ ],
178
+ "somali": [
179
+ 23,
180
+ "\u2581<extra_id_80>"
181
+ ],
182
+ "spanish": [
183
+ 7,
184
+ "\u2581<extra_id_96>"
185
+ ],
186
+ "swahili": [
187
+ 22,
188
+ "\u2581<extra_id_81>"
189
+ ],
190
+ "tamil": [
191
+ 36,
192
+ "\u2581<extra_id_67>"
193
+ ],
194
+ "telugu": [
195
+ 26,
196
+ "\u2581<extra_id_77>"
197
+ ],
198
+ "thai": [
199
+ 10,
200
+ "\u2581<extra_id_93>"
201
+ ],
202
+ "tigrinya": [
203
+ 20,
204
+ "\u2581<extra_id_83>"
205
+ ],
206
+ "turkish": [
207
+ 19,
208
+ "\u2581<extra_id_84>"
209
+ ],
210
+ "ukrainian": [
211
+ 6,
212
+ "\u2581<extra_id_97>"
213
+ ],
214
+ "urdu": [
215
+ 42,
216
+ "\u2581<extra_id_61>"
217
+ ],
218
+ "uzbek": [
219
+ 12,
220
+ "\u2581<extra_id_91>"
221
+ ],
222
+ "vietnamese": [
223
+ 16,
224
+ "\u2581<extra_id_87>"
225
+ ],
226
+ "welsh": [
227
+ 30,
228
+ "\u2581<extra_id_73>"
229
+ ],
230
+ "yoruba": [
231
+ 29,
232
+ "\u2581<extra_id_74>"
233
+ ]
234
+ }
235
+ },
236
+ "temperature": 0.1,
237
+ "tie_word_embeddings": false,
238
+ "tokenizer_class": "T5Tokenizer",
239
+ "use_cache": true,
240
+ "use_consistency_loss": true,
241
+ "use_cross_alignment_loss": true,
242
+ "use_queue_for_contrastive": true,
243
+ "vocab_size": 250112
244
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:072be6ebd5cbd42c3bd7a1a6ed1ea9f54c8af2a3fd8d9e109d6816fc882d7903
3
+ size 1200773220
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>"}
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
3
+ size 4309802
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>", "extra_ids": 0, "additional_special_tokens": null, "special_tokens_map_file": "/root/.cache/huggingface/transformers/685ac0ca8568ec593a48b61b0a3c272beee9bc194a3c7241d15dcadb5f875e53.f76030f3ec1b96a8199b2593390c610e76ca8028ef3d24680000619ffb646276", "tokenizer_file": null, "name_or_path": "./"}