{"unk_token": "<|endoftext|>", "bos_token": "<|endoftext|>", "eos_token": "<|endoftext|>", "add_prefix_space": false, "special_tokens_map_file": null, "name_or_path": "data/gpt2_oscar_unshuffled_deduplicated_de_without_4gb_valid/bigs/hf_checkpoints/global_step100000", "tokenizer_class": "GPT2Tokenizer"}