---
# LiteLLM proxy configuration.
# Deployments exposed by the proxy. Entries that share a `model_name` form one
# model group; the suffixed names (-northflank, -k1, -k2) address a single
# deployment directly.
# API keys are `os.environ/<NAME>` references, so no secret is stored here.
model_list:
  # --- OpenAI-compatible endpoint hosted on Northflank -----------------------
  - model_name: gpt-4o-mini-northflank
    litellm_params:
      model: openai/gpt-4o-mini
      api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
      api_key: os.environ/NF_API_KEY
  - model_name: gpt-4o-mini
    litellm_params:
      model: openai/gpt-4o-mini
      api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
      api_key: os.environ/NF_API_KEY
  - model_name: gpt-3.5-turbo-northflank
    litellm_params:
      model: openai/gpt-3.5-turbo
      api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
      api_key: os.environ/NF_API_KEY
  - model_name: gpt-3.5-turbo
    litellm_params:
      model: openai/gpt-3.5-turbo
      api_base: https://yc--northflank-duckapi--b69bn8cbbs7k.code.run/v1
      api_key: os.environ/NF_API_KEY

  # --- Gemini, API key 1 -----------------------------------------------------
  - model_name: gemini-1.5-pro-k1
    litellm_params:
      model: gemini/gemini-1.5-pro
      api_key: os.environ/GEMINI_API_KEY1
  - model_name: gemini-1.5-pro
    litellm_params:
      model: gemini/gemini-1.5-pro
      api_key: os.environ/GEMINI_API_KEY1
      # Per-deployment limits (requests / tokens per minute).
      rpm: 4
      tpm: 6400

  - model_name: gemini-1.5-flash-k1
    litellm_params:
      model: gemini/gemini-1.5-flash
      api_key: os.environ/GEMINI_API_KEY1
  - model_name: gemini-1.5-flash
    litellm_params:
      model: gemini/gemini-1.5-flash
      api_key: os.environ/GEMINI_API_KEY1
      rpm: 30
      tpm: 2000000

  # --- Gemini, API key 2 -----------------------------------------------------
  - model_name: gemini-1.5-pro-k2
    litellm_params:
      model: gemini/gemini-1.5-pro
      api_key: os.environ/GEMINI_API_KEY2
  - model_name: gemini-1.5-pro
    litellm_params:
      model: gemini/gemini-1.5-pro
      # Was os.environ/GEMINI_API_KEY, the only reference to that variable in
      # this file; aligned with the other key-2 entries.
      # NOTE(review): confirm no separate GEMINI_API_KEY was intended.
      api_key: os.environ/GEMINI_API_KEY2
      rpm: 4
      tpm: 6400

  - model_name: gemini-1.5-flash-k2
    litellm_params:
      model: gemini/gemini-1.5-flash
      api_key: os.environ/GEMINI_API_KEY2
  - model_name: gemini-1.5-flash
    litellm_params:
      model: gemini/gemini-1.5-flash
      api_key: os.environ/GEMINI_API_KEY2
      rpm: 30
      tpm: 2000000

# Library-level LiteLLM settings.
litellm_settings:
  # Per-request timeout; presumably seconds -- confirm against LiteLLM docs.
  request_timeout: 20
  num_retries: 3
  # NOTE(review): router_settings.fallbacks is also defined in this file;
  # confirm which list the router honors when both are present.
  fallbacks:
    - gemini-1.5-pro: [gemini-1.5-flash]
  allowed_fails: 3
  cooldown_time: 30
  drop_params: true

# Proxy-server settings.
general_settings:
  # Environment-variable reference (MASTER_KEY); the key is not stored here.
  master_key: os.environ/MASTER_KEY

# Router settings: fallbacks between model groups, aliases, routing strategy.
router_settings:
  fallbacks:
    - gpt-4o-mini: [gemini-1.5-flash]
    - gpt-3.5-turbo: [gemini-1.5-flash]
    # Mirrors litellm_settings.fallbacks so the pro -> flash fallback is kept
    # even if the router-level list takes precedence over the library-level one.
    - gemini-1.5-pro: [gemini-1.5-flash]
  # Requests for "gpt-4" are served by the gemini-1.5-pro model group.
  model_group_alias:
    gpt-4: gemini-1.5-pro
  routing_strategy: simple-shuffle