{
  "version": "1.0",
  "truncation": null,
  "padding": {
    "strategy": "BatchLongest",
    "direction": "Right",
    "pad_to_multiple_of": null,
    "pad_id": 0,
    "pad_type_id": 0,
    "pad_token": "[PAD]"
  },
  "added_tokens": [
    {
      "id": 0,
      "content": "[PAD]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 1,
      "content": "[SOS]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 2,
      "content": "[EOS]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    }
  ],
  "normalizer": null,
  "pre_tokenizer": null,
  "post_processor": null,
  "decoder": null,
  "model": {
    "type": "BPE",
    "dropout": null,
    "unk_token": null,
    "continuing_subword_prefix": null,
    "end_of_word_suffix": null,
    "fuse_unk": false,
    "byte_fallback": false,
    "vocab": {
      "[PAD]": 0,
      "[SOS]": 1,
      "[EOS]": 2,
      "-": 3,
      "U": 4
    },
    "merges": []
  }
}