# litellm/litellm_config.yaml — "Create litellm_config.yaml" (commit f5aec1b, verified; author: lemonteaa; 648 bytes)
# Deployments exposed by the LiteLLM proxy. Each entry maps a public alias
# (`model_name`, what clients request) to the provider call described in
# `litellm_params`.
model_list:
  # Mistral 7B Instruct v0.3 via the Hugging Face provider.
  - model_name: hf-mistral-7b-instruct-v03
    litellm_params:
      model: huggingface/mistralai/Mistral-7B-Instruct-v0.3
      # `os.environ/<NAME>` is resolved from the environment, so the secret
      # itself is never stored in this file.
      api_key: os.environ/HUGGINGFACE_API_KEY
      # NOTE(review): this is the bare Inference API root. Confirm LiteLLM
      # still appends the model path when api_base is overridden; if not,
      # drop this line to fall back to the provider default.
      api_base: "https://api-inference.huggingface.co/"
      # Alternative: point at a dedicated Inference Endpoint instead.
      # api_base: "https://my-endpoint.endpoints.huggingface.cloud"

  # Llama 3 8B Instruct served by AwanLLM; the `openai/` prefix selects the
  # OpenAI-compatible client against the custom api_base below.
  - model_name: awan-llama3-8b
    litellm_params:
      model: openai/Meta-Llama-3-8B-Instruct
      api_key: os.environ/OTHER_AWANLLM_API_KEY
      api_base: "https://api.awanllm.com/v1"
      # Requests-per-minute budget for this deployment.
      rpm: 10
# Proxy-wide LiteLLM settings; these keys must be nested under
# `litellm_settings` to take effect.
litellm_settings:
  # Send both successful and failed calls to Langfuse.
  # NOTE(review): the Langfuse credentials are expected to come from the
  # environment — confirm they are set where the proxy runs.
  success_callback: ["langfuse"]
  failure_callback: ["langfuse"]
  # Retry a failed call up to 3 times.
  num_retries: 3
  # Per-request timeout (seconds, per LiteLLM docs).
  request_timeout: 20
  # Number of failures tolerated before a deployment is cooled down.
  allowed_fails: 3