Spaces:
Sleeping
Sleeping
Create litellm_config.yaml
Browse files- litellm_config.yaml +20 -0
litellm_config.yaml
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# LiteLLM configuration: model deployments plus global settings.
# NOTE(review): the nesting below was reconstructed from a diff view that
# had lost all indentation — confirm against the committed file.
model_list:
  # Mistral 7B Instruct v0.3, addressed through the "huggingface/" prefix.
  - model_name: hf-mistral-7b-instruct-v03
    litellm_params:
      model: huggingface/mistralai/Mistral-7B-Instruct-v0.3
      # The key is referenced by environment-variable name, not stored inline.
      api_key: os.environ/HUGGINGFACE_API_KEY
      api_base: "https://api-inference.huggingface.co/"
      # Alternative base URL, kept disabled:
      # api_base: "https://my-endpoint.endpoints.huggingface.cloud"

  # Llama 3 8B Instruct served from api.awanllm.com, addressed through the
  # "openai/" prefix.
  - model_name: awan-llama3-8b
    litellm_params:
      model: openai/Meta-Llama-3-8B-Instruct
      api_key: os.environ/OTHER_AWANLLM_API_KEY
      api_base: "https://api.awanllm.com/v1"
      # NOTE(review): presumably a requests-per-minute cap; its placement
      # under litellm_params is assumed from key order — confirm.
      rpm: 10

litellm_settings:
  # The same callback is registered for both successful and failed calls.
  success_callback: ["langfuse"]
  failure_callback: ["langfuse"]
  num_retries: 3
  # NOTE(review): unit not shown here; presumably seconds — confirm.
  request_timeout: 20
  allowed_fails: 3