Llama-2-70b-hf-v16-k65536-65536-woft / generation_config.json
OpenSourceRonin's picture
Upload model Llama-2-70b-hf-v16-k65536-65536-woft
2f5956c verified
{
"attn_implementation": "flash_attention_2",
"bos_token_id": 1,
"do_sample": true,
"eos_token_id": 2,
"max_length": 4096,
"num_assistant_tokens": 5,
"num_assistant_tokens_schedule": "heuristic",
"pad_token_id": 0,
"return_legacy_cache": true,
"temperature": 0.6,
"top_p": 0.9,
"transformers_version": "4.45.1"
}