# LiteLLM proxy configuration: model deployments plus retry, fallback and
# routing settings.
---
# Deployments exposed by the proxy. Entries that share a `model_name` belong
# to the same model group; `os.environ/NAME` values are resolved from the
# environment by LiteLLM rather than stored in this file.
model_list:
# --- OpenAI-compatible endpoint hosted on Northflank ---
# Each model is published under a "-northflank" name and under its plain
# name; all four entries use the same api_base and the same key.
- model_name: gpt-4o-mini-northflank
  litellm_params:
    model: openai/gpt-4o-mini
    api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
    api_key: os.environ/NF_API_KEY
- model_name: gpt-4o-mini
  litellm_params:
    model: openai/gpt-4o-mini
    api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
    api_key: os.environ/NF_API_KEY
- model_name: gpt-3.5-turbo-northflank
  litellm_params:
    model: openai/gpt-3.5-turbo
    api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
    api_key: os.environ/NF_API_KEY
- model_name: gpt-3.5-turbo
  litellm_params:
    model: openai/gpt-3.5-turbo
    api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
    api_key: os.environ/NF_API_KEY

# --- GitHub Models: gpt-4o ---
# `gpt-4o-k1` / `gpt-4o-k2` each address one specific API key. The two
# `github/gpt-4o` entries share a model_name (one per key) and carry the
# per-deployment rpm/tpm limits.
- model_name: gpt-4o-k1
  litellm_params:
    model: github/gpt-4o
    api_base: https://models.inference.ai.azure.com
    api_key: os.environ/GITHUB_API_KEY1
- model_name: github/gpt-4o
  litellm_params:
    model: github/gpt-4o
    api_key: os.environ/GITHUB_API_KEY1
    rpm: 30
    tpm: 2000000
- model_name: gpt-4o-k2
  litellm_params:
    model: github/gpt-4o
    api_base: https://models.inference.ai.azure.com
    api_key: os.environ/GITHUB_API_KEY2
- model_name: github/gpt-4o
  litellm_params:
    model: github/gpt-4o
    api_key: os.environ/GITHUB_API_KEY2
    rpm: 30
    tpm: 2000000

# --- GitHub Models: Mistral-large-2411 ---
# `-k1` / `-k2` names address one specific API key; the two
# `github/Mistral-large-2411` entries share a model_name, one per key.
- model_name: Mistral-large-2411-k1
  litellm_params:
    model: github/Mistral-large-2411
    api_base: https://models.inference.ai.azure.com
    api_key: os.environ/GITHUB_API_KEY1
- model_name: github/Mistral-large-2411
  litellm_params:
    model: github/Mistral-large-2411
    api_key: os.environ/GITHUB_API_KEY1
    rpm: 30
    tpm: 2000000
- model_name: Mistral-large-2411-k2
  litellm_params:
    model: github/Mistral-large-2411
    api_base: https://models.inference.ai.azure.com
    api_key: os.environ/GITHUB_API_KEY2
- model_name: github/Mistral-large-2411
  litellm_params:
    model: github/Mistral-large-2411
    api_key: os.environ/GITHUB_API_KEY2
    rpm: 30
    tpm: 2000000

# --- GitHub Models: gpt-4o-mini ---
# `-k1` / `-k2` names address one specific API key; the two
# `github/gpt-4o-mini` entries share a model_name, one per key.
- model_name: gpt-4o-mini-k1
  litellm_params:
    model: github/gpt-4o-mini
    api_base: https://models.inference.ai.azure.com
    api_key: os.environ/GITHUB_API_KEY1
- model_name: github/gpt-4o-mini
  litellm_params:
    model: github/gpt-4o-mini
    api_key: os.environ/GITHUB_API_KEY1
    rpm: 30
    tpm: 2000000
- model_name: gpt-4o-mini-k2
  litellm_params:
    model: github/gpt-4o-mini
    api_base: https://models.inference.ai.azure.com
    api_key: os.environ/GITHUB_API_KEY2
- model_name: github/gpt-4o-mini
  litellm_params:
    model: github/gpt-4o-mini
    api_key: os.environ/GITHUB_API_KEY2
    rpm: 30
    tpm: 2000000

# --- Gemini: gemini-1.5-pro ---
# `-k1` / `-k2` names address one specific API key; the two `gemini-1.5-pro`
# entries share a model_name, one per key, with rpm/tpm limits.
- model_name: gemini-1.5-pro-k1
  litellm_params:
    model: gemini/gemini-1.5-pro
    api_key: os.environ/GEMINI_API_KEY1
- model_name: gemini-1.5-pro
  litellm_params:
    model: gemini/gemini-1.5-pro
    api_key: os.environ/GEMINI_API_KEY1
    rpm: 4
    tpm: 6400
- model_name: gemini-1.5-pro-k2
  litellm_params:
    model: gemini/gemini-1.5-pro
    api_key: os.environ/GEMINI_API_KEY2
- model_name: gemini-1.5-pro
  litellm_params:
    model: gemini/gemini-1.5-pro
    # Second group member uses key 2, like the `-k2` entry directly above.
    # NOTE(review): this previously read GEMINI_API_KEY (no suffix); restore
    # it if a separate third key was intended.
    api_key: os.environ/GEMINI_API_KEY2
    rpm: 4
    tpm: 6400

# --- Gemini: gemini-1.5-pro-002 ---
# `-k1` / `-k2` names address one specific API key; the two
# `gemini-1.5-pro-002` entries share a model_name, one per key.
- model_name: gemini-1.5-pro-002-k1
  litellm_params:
    model: gemini/gemini-1.5-pro-002
    api_key: os.environ/GEMINI_API_KEY1
- model_name: gemini-1.5-pro-002
  litellm_params:
    # Both members of this group must serve the same model; this one
    # previously pointed at gemini/gemini-1.5-flash-002.
    model: gemini/gemini-1.5-pro-002
    api_key: os.environ/GEMINI_API_KEY1
    rpm: 75
    tpm: 5000000
- model_name: gemini-1.5-pro-002-k2
  litellm_params:
    model: gemini/gemini-1.5-pro-002
    api_key: os.environ/GEMINI_API_KEY2
- model_name: gemini-1.5-pro-002
  litellm_params:
    model: gemini/gemini-1.5-pro-002
    api_key: os.environ/GEMINI_API_KEY2
    rpm: 75
    tpm: 5000000

# --- Gemini: gemini-1.5-pro-exp ---
# `-k1` / `-k2` names address one specific API key; the two
# `gemini-1.5-pro-exp` entries share a model_name, one per key.
- model_name: gemini-1.5-pro-exp-k1
  litellm_params:
    model: gemini/gemini-1.5-pro-exp
    api_key: os.environ/GEMINI_API_KEY1
- model_name: gemini-1.5-pro-exp
  litellm_params:
    model: gemini/gemini-1.5-pro-exp
    api_key: os.environ/GEMINI_API_KEY1
    rpm: 75
    tpm: 5000000
- model_name: gemini-1.5-pro-exp-k2
  litellm_params:
    model: gemini/gemini-1.5-pro-exp
    api_key: os.environ/GEMINI_API_KEY2
- model_name: gemini-1.5-pro-exp
  litellm_params:
    model: gemini/gemini-1.5-pro-exp
    api_key: os.environ/GEMINI_API_KEY2
    rpm: 75
    tpm: 5000000

# --- Gemini: gemini-2.0-flash-exp ---
# `-k1` / `-k2` names address one specific API key; the two
# `gemini-2.0-flash-exp` entries share a model_name, one per key.
- model_name: gemini-2.0-flash-exp-k1
  litellm_params:
    model: gemini/gemini-2.0-flash-exp
    api_key: os.environ/GEMINI_API_KEY1
- model_name: gemini-2.0-flash-exp
  litellm_params:
    model: gemini/gemini-2.0-flash-exp
    api_key: os.environ/GEMINI_API_KEY1
    rpm: 50
    tpm: 5000000
- model_name: gemini-2.0-flash-exp-k2
  litellm_params:
    model: gemini/gemini-2.0-flash-exp
    api_key: os.environ/GEMINI_API_KEY2
- model_name: gemini-2.0-flash-exp
  litellm_params:
    model: gemini/gemini-2.0-flash-exp
    api_key: os.environ/GEMINI_API_KEY2
    rpm: 50
    tpm: 5000000

# --- Gemini: gemini-2.0-flash-thinking-exp ---
# `-k1` / `-k2` names address one specific API key; the two
# `gemini-2.0-flash-thinking-exp` entries share a model_name, one per key.
- model_name: gemini-2.0-flash-thinking-exp-k1
  litellm_params:
    model: gemini/gemini-2.0-flash-thinking-exp
    api_key: os.environ/GEMINI_API_KEY1
- model_name: gemini-2.0-flash-thinking-exp
  litellm_params:
    model: gemini/gemini-2.0-flash-thinking-exp
    api_key: os.environ/GEMINI_API_KEY1
    rpm: 50
    tpm: 5000000
- model_name: gemini-2.0-flash-thinking-exp-k2
  litellm_params:
    model: gemini/gemini-2.0-flash-thinking-exp
    api_key: os.environ/GEMINI_API_KEY2
- model_name: gemini-2.0-flash-thinking-exp
  litellm_params:
    model: gemini/gemini-2.0-flash-thinking-exp
    api_key: os.environ/GEMINI_API_KEY2
    rpm: 50
    tpm: 5000000

# --- Gemini: gemini-2.0-flash-thinking-exp-1219 ---
# `-k1` / `-k2` names address one specific API key; the two
# `gemini-2.0-flash-thinking-exp-1219` entries share a model_name, one per key.
- model_name: gemini-2.0-flash-thinking-exp-1219-k1
  litellm_params:
    model: gemini/gemini-2.0-flash-thinking-exp-1219
    api_key: os.environ/GEMINI_API_KEY1
- model_name: gemini-2.0-flash-thinking-exp-1219
  litellm_params:
    model: gemini/gemini-2.0-flash-thinking-exp-1219
    api_key: os.environ/GEMINI_API_KEY1
    rpm: 50
    tpm: 5000000
- model_name: gemini-2.0-flash-thinking-exp-1219-k2
  litellm_params:
    model: gemini/gemini-2.0-flash-thinking-exp-1219
    api_key: os.environ/GEMINI_API_KEY2
- model_name: gemini-2.0-flash-thinking-exp-1219
  litellm_params:
    model: gemini/gemini-2.0-flash-thinking-exp-1219
    api_key: os.environ/GEMINI_API_KEY2
    rpm: 50
    tpm: 5000000

# --- Gemini: gemini-exp-1206 ---
# `-k1` / `-k2` names address one specific API key; the two
# `gemini-exp-1206` entries share a model_name, one per key.
- model_name: gemini-exp-1206-k1
  litellm_params:
    model: gemini/gemini-exp-1206
    api_key: os.environ/GEMINI_API_KEY1
- model_name: gemini-exp-1206
  litellm_params:
    model: gemini/gemini-exp-1206
    api_key: os.environ/GEMINI_API_KEY1
    rpm: 20
    tpm: 5000000
- model_name: gemini-exp-1206-k2
  litellm_params:
    model: gemini/gemini-exp-1206
    api_key: os.environ/GEMINI_API_KEY2
- model_name: gemini-exp-1206
  litellm_params:
    model: gemini/gemini-exp-1206
    api_key: os.environ/GEMINI_API_KEY2
    rpm: 20
    tpm: 5000000

# --- Gemini: gemini-exp-1121 ---
# `-k1` / `-k2` names address one specific API key; the two
# `gemini-exp-1121` entries share a model_name, one per key.
- model_name: gemini-exp-1121-k1
  litellm_params:
    model: gemini/gemini-exp-1121
    api_key: os.environ/GEMINI_API_KEY1
- model_name: gemini-exp-1121
  litellm_params:
    model: gemini/gemini-exp-1121
    api_key: os.environ/GEMINI_API_KEY1
    rpm: 20
    tpm: 5000000
- model_name: gemini-exp-1121-k2
  litellm_params:
    model: gemini/gemini-exp-1121
    api_key: os.environ/GEMINI_API_KEY2
- model_name: gemini-exp-1121
  litellm_params:
    model: gemini/gemini-exp-1121
    api_key: os.environ/GEMINI_API_KEY2
    rpm: 20
    tpm: 5000000

# --- Gemini: gemini-exp-1114 ---
# `-k1` / `-k2` names address one specific API key; the two
# `gemini-exp-1114` entries share a model_name, one per key.
- model_name: gemini-exp-1114-k1
  litellm_params:
    model: gemini/gemini-exp-1114
    api_key: os.environ/GEMINI_API_KEY1
- model_name: gemini-exp-1114
  litellm_params:
    model: gemini/gemini-exp-1114
    api_key: os.environ/GEMINI_API_KEY1
    rpm: 20
    tpm: 5000000
- model_name: gemini-exp-1114-k2
  litellm_params:
    model: gemini/gemini-exp-1114
    api_key: os.environ/GEMINI_API_KEY2
- model_name: gemini-exp-1114
  litellm_params:
    model: gemini/gemini-exp-1114
    api_key: os.environ/GEMINI_API_KEY2
    rpm: 20
    tpm: 5000000

# Library-level settings: timeout, retries, fallbacks and cooldown behaviour.
litellm_settings:
  request_timeout: 20
  num_retries: 3
  # NOTE(review): no `gemini-1.5-flash` model_name is defined in the
  # model_list visible in this file; confirm the fallback target exists.
  fallbacks: [{"gemini-1.5-pro": ["gemini-1.5-flash"]}]
  allowed_fails: 3
  cooldown_time: 30
  drop_params: true

# Proxy-wide settings. The master key is read from the MASTER_KEY environment
# variable instead of being stored in this file.
general_settings:
  master_key: os.environ/MASTER_KEY

# Router behaviour: per-group fallbacks, a model-name alias and the routing
# strategy.
router_settings:
  # NOTE(review): no `gemini-1.5-flash` model_name is defined in the
  # model_list visible in this file; confirm the fallback target exists.
  fallbacks: [{"gpt-4o-mini": ["gemini-1.5-flash"]}, {"gpt-3.5-turbo": ["gemini-1.5-flash"]}]
  # Maps the name `gpt-4` to the `gemini-1.5-pro` group.
  model_group_alias:
    gpt-4: gemini-1.5-pro
  routing_strategy: simple-shuffle