29 lines
814 B
YAML
29 lines
814 B
YAML
---
# ConfigMap holding the LiteLLM proxy configuration for the ai-core namespace.
# Everything under `config.yaml` is a literal block scalar: it is stored as
# plain text and parsed as YAML by LiteLLM, not by Kubernetes.
apiVersion: v1
kind: ConfigMap
metadata:
  name: litellm-config
  namespace: ai-core
data:
  config.yaml: |
    # Model groups exposed by the proxy; both point at the same Ollama service.
    model_list:
      - model_name: ollama-qwen
        litellm_params:
          model: ollama/qwen2.5:14b
          api_base: http://ollama.ai-core.svc.cluster.local:11434
      - model_name: ollama-gemma
        litellm_params:
          model: ollama/gemma:7b
          api_base: http://ollama.ai-core.svc.cluster.local:11434

    router_settings:
      routing_strategy: simple-shuffle
      num_retries: 2
      timeout: 120
      allowed_fails: 2
      # Each entry must be a single-key mapping of
      # <model group>: [<fallback model groups>]; a list of bare model names
      # does not describe a fallback.
      # NOTE(review): the original listed only the two model names, so the
      # direction below is an assumption (ollama-qwen presumed to have the
      # larger context window) - confirm before deploying.
      context_window_fallbacks:
        - ollama-gemma:
            - ollama-qwen

    litellm_settings:
      max_budget: 5
      budget_duration: 1d
      # Virtual keys / teams: use $20/day for dev-agent keys, configured in
      # LiteLLM admin or in a separate deployment profile.