{
  "add_prefix_space": false,
  "added_tokens_decoder": {
    "0": {
      "content": "<unk>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "1": {
      "content": "<s>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "2": {
      "content": "</s>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "3": {
      "content": "<pad>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "96499": {
      "content": "<|start|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "96500": {
      "content": "<|end|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "96501": {
      "content": "<|message|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "96502": {
      "content": "<|tool_start|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "96503": {
      "content": "<|tool_excute|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "96504": {
      "content": "<|tool_end|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "96505": {
      "content": "<|pad|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "96506": {
      "content": "<|endoftext|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    }
  },
  "additional_special_tokens": [
    "<|start|>",
    "<|end|>",
    "<|message|>",
    "<|tool_start|>",
    "<|tool_excute|>",
    "<|tool_end|>",
    "<|pad|>",
    "<|endoftext|>"
  ],
  "auto_map": {
    "AutoTokenizer": [
      "tokenization_inflm.INFLMTokenizer",
      null
    ]
  },
  "bos_token": "<s>",
  "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{% if not loop.first %}{{ '\\n' }}{% endif %}{{'<|start|>user\\n' + message['content'] + '<|end|>\\n' }}{% if (loop.last and add_generation_prompt) %}{{ '<|start|>assistant<|message|>' }}{% endif %}{% elif message['role'] == 'system' %}{{ '<|start|>system\\n' + message['content'] + '<|end|>' }}{% elif message['role'] == 'assistant' %}{{ '<|start|>assistant<|message|>' + message['content'] + '<|end|>' }}{% endif %}{% endfor %}",
  "clean_up_tokenization_spaces": false,
  "eos_token": "</s>",
  "model_max_length": 1000000000000000019884624838656,
  "pad_token": "<pad>",
  "return_tensors": true,
  "spaces_between_special_tokens": false,
  "tokenizer_class": "INFLMTokenizer",
  "unk_token": "<unk>"
}