# LiteLLM proxy configuration: the model deployments exposed by the proxy,
# followed by library-wide settings (callbacks, retries, timeout).
model_list:
  # Mistral 7B Instruct v0.3, addressed through the "huggingface/" provider
  # prefix.
  - model_name: hf-mistral-7b-instruct-v03
    litellm_params:
      model: huggingface/mistralai/Mistral-7B-Instruct-v0.3
      # "os.environ/<NAME>" asks LiteLLM to read the value from that
      # environment variable, so no secret is stored in this file.
      api_key: os.environ/HUGGINGFACE_API_KEY
      api_base: "https://api-inference.huggingface.co/"
      # Alternative base URL, left disabled:
      # api_base: "https://my-endpoint.endpoints.huggingface.cloud"

  # Llama 3 8B Instruct served by AwanLLM; the "openai/" prefix is used with
  # a custom api_base, i.e. the endpoint is called with the OpenAI-style API.
  - model_name: awan-llama3-8b
    litellm_params:
      model: openai/Meta-Llama-3-8B-Instruct
      api_key: os.environ/OTHER_AWANLLM_API_KEY
      api_base: "https://api.awanllm.com/v1"
      # Requests-per-minute limit for this deployment.
      # NOTE(review): the original nesting was lost; placed under
      # litellm_params as in the LiteLLM docs -- confirm.
      rpm: 10

litellm_settings:
  # Report both successful and failed calls to Langfuse.
  success_callback: ["langfuse"]
  failure_callback: ["langfuse"]
  # Retry a failed call up to this many times.
  num_retries: 3
  # Per-request timeout (seconds, per the LiteLLM docs).
  request_timeout: 20
  # Failures tolerated before LiteLLM cools a deployment down.
  allowed_fails: 3