---
# Proxy configuration: model deployments plus litellm / router / general
# settings.
# NOTE(review): nesting below was rebuilt from a flattened copy of this file
# (indentation lost, stray "|" on every line). Key order and values are
# unchanged; confirm the nesting against the upstream config before deploying.

model_list:
  # Two entries share this model_name (one OpenAI, one Azure deployment).
  - model_name: gpt-3.5-turbo-end-user-test
    litellm_params:
      model: gpt-3.5-turbo
      region_name: "eu"
    model_info:
      id: "1"
  - model_name: gpt-3.5-turbo-end-user-test
    litellm_params:
      model: azure/chatgpt-v-2
      api_base: https://openai-gpt-4-test-v-1.openai.azure.com/
      api_version: "2023-05-15"
      api_key: os.environ/AZURE_API_KEY
  - model_name: gpt-3.5-turbo
    litellm_params:
      model: azure/chatgpt-v-2
      api_base: https://openai-gpt-4-test-v-1.openai.azure.com/
      api_version: "2023-05-15"
      api_key: os.environ/AZURE_API_KEY
  - model_name: gpt-3.5-turbo-large
    litellm_params:
      model: "gpt-3.5-turbo-1106"
      api_key: os.environ/OPENAI_API_KEY
      rpm: 480
      timeout: 300
      stream_timeout: 60
  - model_name: gpt-4
    litellm_params:
      model: azure/chatgpt-v-2
      api_base: https://openai-gpt-4-test-v-1.openai.azure.com/
      api_version: "2023-05-15"
      api_key: os.environ/AZURE_API_KEY
      rpm: 480
      timeout: 300
      stream_timeout: 60
  - model_name: sagemaker-completion-model
    litellm_params:
      model: sagemaker/berri-benchmarking-Llama-2-70b-chat-hf-4
      input_cost_per_second: 0.000420
  - model_name: text-embedding-ada-002
    litellm_params:
      model: azure/azure-embedding-model
      api_key: os.environ/AZURE_API_KEY
      api_base: https://openai-gpt-4-test-v-1.openai.azure.com/
      api_version: "2023-05-15"
    model_info:
      mode: embedding
      base_model: text-embedding-ada-002
  - model_name: dall-e-2
    litellm_params:
      # NOTE(review): nothing follows "azure/" here; confirm the empty
      # deployment name is intentional.
      model: azure/
      api_version: "2023-06-01-preview"
      api_base: https://openai-gpt-4-test-v-1.openai.azure.com/
      api_key: os.environ/AZURE_API_KEY
  - model_name: openai-dall-e-3
    litellm_params:
      model: dall-e-3
  - model_name: fake-openai-endpoint
    litellm_params:
      model: openai/fake
      api_key: fake-key
      api_base: https://exampleopenaiendpoint-production.up.railway.app/
  - model_name: fake-openai-endpoint-2
    litellm_params:
      model: openai/my-fake-model
      api_key: my-fake-key
      api_base: https://exampleopenaiendpoint-production.up.railway.app/
      stream_timeout: 0.001
      rpm: 1
  # fake-openai-endpoint-3 is declared twice (my-fake-model here,
  # my-fake-model-2 further down).
  - model_name: fake-openai-endpoint-3
    litellm_params:
      model: openai/my-fake-model
      api_key: my-fake-key
      api_base: https://exampleopenaiendpoint-production.up.railway.app/
      stream_timeout: 0.001
      rpm: 1000
  - model_name: fake-openai-endpoint-4
    litellm_params:
      model: openai/my-fake-model
      api_key: my-fake-key
      api_base: https://exampleopenaiendpoint-production.up.railway.app/
      num_retries: 50
  - model_name: fake-openai-endpoint-3
    litellm_params:
      model: openai/my-fake-model-2
      api_key: my-fake-key
      api_base: https://exampleopenaiendpoint-production.up.railway.app/
      stream_timeout: 0.001
      rpm: 1000
  - model_name: bad-model
    litellm_params:
      model: openai/bad-model
      api_key: os.environ/OPENAI_API_KEY
      api_base: https://exampleopenaiendpoint-production.up.railway.app/
      mock_timeout: true
      timeout: 60
      rpm: 1000
    model_info:
      health_check_timeout: 1
  # Same underlying model string as bad-model, but without mock_timeout.
  - model_name: good-model
    litellm_params:
      model: openai/bad-model
      api_key: os.environ/OPENAI_API_KEY
      api_base: https://exampleopenaiendpoint-production.up.railway.app/
      rpm: 1000
    model_info:
      health_check_timeout: 1
  # Wildcard entries: "*" plus one pattern per provider prefix.
  - model_name: "*"
    litellm_params:
      model: "openai/*"
      api_key: os.environ/OPENAI_API_KEY
  - model_name: "anthropic/*"
    litellm_params:
      model: "anthropic/*"
      api_key: os.environ/ANTHROPIC_API_KEY
  - model_name: "bedrock/*"
    litellm_params:
      model: "bedrock/*"
  - model_name: "groq/*"
    litellm_params:
      model: "groq/*"
      api_key: os.environ/GROQ_API_KEY
  - model_name: mistral-embed
    litellm_params:
      model: mistral/mistral-embed
  - model_name: gpt-instruct
    litellm_params:
      model: text-completion-openai/gpt-3.5-turbo-instruct
  - model_name: fake-openai-endpoint-5
    litellm_params:
      model: openai/my-fake-model
      api_key: my-fake-key
      api_base: https://exampleopenaiendpoint-production.up.railway.app/
      timeout: 1

litellm_settings:
  drop_params: true
  num_retries: 5
  request_timeout: 600
  telemetry: false
  # One fallback mapping: gpt-3.5-turbo -> [gpt-3.5-turbo-large].
  context_window_fallbacks:
    - gpt-3.5-turbo:
        - gpt-3.5-turbo-large
  # Per-team callback settings; each team reads its own Langfuse key pair.
  default_team_settings:
    - team_id: team-1
      success_callback: ["langfuse"]
      failure_callback: ["langfuse"]
      langfuse_public_key: os.environ/LANGFUSE_PROJECT1_PUBLIC
      langfuse_secret: os.environ/LANGFUSE_PROJECT1_SECRET
    - team_id: team-2
      success_callback: ["langfuse"]
      failure_callback: ["langfuse"]
      langfuse_public_key: os.environ/LANGFUSE_PROJECT2_PUBLIC
      langfuse_secret: os.environ/LANGFUSE_PROJECT2_SECRET
      langfuse_host: https://us.cloud.langfuse.com

finetune_settings:
  - custom_llm_provider: azure
    api_base: os.environ/AZURE_API_BASE
    api_key: os.environ/AZURE_API_KEY
    api_version: "2023-03-15-preview"
  - custom_llm_provider: openai
    api_key: os.environ/OPENAI_API_KEY

files_settings:
  - custom_llm_provider: azure
    api_base: os.environ/AZURE_API_BASE
    api_key: os.environ/AZURE_API_KEY
    api_version: "2023-03-15-preview"
  - custom_llm_provider: openai
    api_key: os.environ/OPENAI_API_KEY

router_settings:
  routing_strategy: usage-based-routing-v2
  redis_host: os.environ/REDIS_HOST
  redis_password: os.environ/REDIS_PASSWORD
  redis_port: os.environ/REDIS_PORT
  enable_pre_call_checks: true
  # Alias name -> model_name declared in model_list above.
  model_group_alias:
    my-special-fake-model-alias-name: fake-openai-endpoint-3

general_settings:
  # NOTE(review): literal key committed in the file, unlike the other
  # credentials here which use os.environ/ references; presumably a
  # test-only value. Confirm before reusing this config outside tests.
  master_key: sk-1234
  store_model_in_db: true
  proxy_budget_rescheduler_min_time: 60
  proxy_budget_rescheduler_max_time: 64
  proxy_batch_write_at: 1
  database_connection_pool_limit: 10
  # NOTE(review): placed under general_settings per the LiteLLM proxy
  # layout; the flattened source cannot show whether it was nested here or
  # top-level, so verify.
  pass_through_endpoints:
    - path: "/v1/rerank"
      target: "https://api.cohere.com/v1/rerank"
      headers:
        content-type: application/json
        accept: application/json
      forward_headers: true