Fixed litellm
This commit is contained in:
@@ -4,13 +4,15 @@
|
|||||||
# logo: svgs/litellm.svg
|
# logo: svgs/litellm.svg
|
||||||
# port: 4000
|
# port: 4000
|
||||||
|
|
||||||
|
version: "3"
|
||||||
|
|
||||||
volumes:
|
volumes:
|
||||||
pg-data: null
|
pg_data: null
|
||||||
redis-data: null
|
redis_data: null
|
||||||
|
|
||||||
services:
|
services:
|
||||||
litellm:
|
litellm:
|
||||||
image: "ghcr.io/berriai/litellm-database:main-latest"
|
image: "ghcr.io/berriai/litellm-database:main-stable"
|
||||||
restart: always
|
restart: always
|
||||||
depends_on:
|
depends_on:
|
||||||
postgres:
|
postgres:
|
||||||
@@ -18,9 +20,10 @@ services:
|
|||||||
redis:
|
redis:
|
||||||
condition: service_healthy
|
condition: service_healthy
|
||||||
environment:
|
environment:
|
||||||
|
- SERVICE_FQDN_LITELLM_4000
|
||||||
- LITELLM_LOG=ERROR
|
- LITELLM_LOG=ERROR
|
||||||
- LITELLM_MODE=PRODUCTION
|
- LITELLM_MODE=PRODUCTION
|
||||||
- "LITELLM_MASTER_KEY=${SERVICE_PASSWORD_32_LITELLM_MASTER_KEY}"
|
- "LITELLM_MASTER_KEY=${SERVICE_PASSWORD_MASTERKEY}"
|
||||||
- "UI_USERNAME=${SERVICE_USER_UI}"
|
- "UI_USERNAME=${SERVICE_USER_UI}"
|
||||||
- "UI_PASSWORD=${SERVICE_PASSWORD_UI}"
|
- "UI_PASSWORD=${SERVICE_PASSWORD_UI}"
|
||||||
- "DATABASE_URL=postgresql://${SERVICE_USER_POSTGRES}:${SERVICE_PASSWORD_POSTGRES}@postgres:5432/${POSTGRES_DB:-litellm}"
|
- "DATABASE_URL=postgresql://${SERVICE_USER_POSTGRES}:${SERVICE_PASSWORD_POSTGRES}@postgres:5432/${POSTGRES_DB:-litellm}"
|
||||||
@@ -36,16 +39,14 @@ services:
|
|||||||
- "VOYAGE_API_KEY=${VOYAGE_API_KEY}"
|
- "VOYAGE_API_KEY=${VOYAGE_API_KEY}"
|
||||||
- "VOYAGE_API_BASE=${VOYAGE_API_BASE}"
|
- "VOYAGE_API_BASE=${VOYAGE_API_BASE}"
|
||||||
volumes:
|
volumes:
|
||||||
- "./litellm-config.yaml:/app/config.yaml"
|
|
||||||
- type: bind
|
- type: bind
|
||||||
source: ./docker/app/config.yaml
|
source: ./litellm-config.yaml
|
||||||
target: /app/config.yaml
|
target: /app/config.yaml
|
||||||
content: |
|
content: |
|
||||||
general_settings:
|
general_settings:
|
||||||
proxy_batch_write_at: 60
|
proxy_batch_write_at: 60
|
||||||
|
|
||||||
router_settings:
|
router_settings:
|
||||||
routing_strategy: usage-based-routing-v2
|
|
||||||
redis_host: os.environ/REDIS_HOST
|
redis_host: os.environ/REDIS_HOST
|
||||||
redis_port: os.environ/REDIS_PORT
|
redis_port: os.environ/REDIS_PORT
|
||||||
redis_password: os.environ/REDIS_PASSWORD
|
redis_password: os.environ/REDIS_PASSWORD
|
||||||
@@ -57,6 +58,7 @@ services:
|
|||||||
log_raw_request_response: true
|
log_raw_request_response: true
|
||||||
# turn_off_message_logging: false
|
# turn_off_message_logging: false
|
||||||
# redact_user_api_key_info: false
|
# redact_user_api_key_info: false
|
||||||
|
service_callback: ["prometheus_system"]
|
||||||
drop_params: true
|
drop_params: true
|
||||||
# max_budget: 100
|
# max_budget: 100
|
||||||
# budget_duration: 30d
|
# budget_duration: 30d
|
||||||
@@ -71,19 +73,14 @@ services:
|
|||||||
password: os.environ/REDIS_PASSWORD
|
password: os.environ/REDIS_PASSWORD
|
||||||
namespace: "litellm_cache"
|
namespace: "litellm_cache"
|
||||||
ttl: 600
|
ttl: 600
|
||||||
# success_callback:
|
success_callback:
|
||||||
# - "langfuse"
|
# - "langfuse"
|
||||||
# - "prometheus"
|
- "prometheus"
|
||||||
# failure_callback:
|
failure_callback:
|
||||||
# - "langfuse"
|
# - "langfuse"
|
||||||
# - "prometheus"
|
- "prometheus"
|
||||||
model_list:
|
model_list:
|
||||||
# OpenAI
|
# OpenAI
|
||||||
- model_name: gpt-3.5-turbo
|
|
||||||
litellm_params:
|
|
||||||
model: openai/gpt-3.5-turbo
|
|
||||||
api_key: os.environ/OPENAI_API_KEY
|
|
||||||
api_base: os.environ/OPENAI_API_BASE
|
|
||||||
- model_name: gpt-4
|
- model_name: gpt-4
|
||||||
litellm_params:
|
litellm_params:
|
||||||
model: openai/gpt-4
|
model: openai/gpt-4
|
||||||
@@ -118,8 +115,8 @@ services:
|
|||||||
model: voyage/voyage-law-2
|
model: voyage/voyage-law-2
|
||||||
api_key: "os.environ/VOYAGE_API_KEY"
|
api_key: "os.environ/VOYAGE_API_KEY"
|
||||||
api_base: "os.environ/VOYAGE_API_BASE"
|
api_base: "os.environ/VOYAGE_API_BASE"
|
||||||
rpm: 300
|
# rpm: 300
|
||||||
tpm: 1000000
|
# tpm: 1000000
|
||||||
- model_name: voyage-multilingual-2
|
- model_name: voyage-multilingual-2
|
||||||
model_info:
|
model_info:
|
||||||
mode: embedding
|
mode: embedding
|
||||||
@@ -132,8 +129,8 @@ services:
|
|||||||
api_base: "os.environ/VOYAGE_API_BASE"
|
api_base: "os.environ/VOYAGE_API_BASE"
|
||||||
input_cost_per_token: 0.00000012
|
input_cost_per_token: 0.00000012
|
||||||
output_cost_per_token: 0
|
output_cost_per_token: 0
|
||||||
rpm: 300
|
# rpm: 300
|
||||||
tpm: 1000000
|
# tpm: 1000000
|
||||||
healthcheck:
|
healthcheck:
|
||||||
test:
|
test:
|
||||||
- CMD
|
- CMD
|
||||||
@@ -157,7 +154,7 @@ services:
|
|||||||
- POSTGRES_PASSWORD=$SERVICE_PASSWORD_POSTGRES
|
- POSTGRES_PASSWORD=$SERVICE_PASSWORD_POSTGRES
|
||||||
- POSTGRES_USER=$SERVICE_USER_POSTGRES
|
- POSTGRES_USER=$SERVICE_USER_POSTGRES
|
||||||
volumes:
|
volumes:
|
||||||
- "pg-data:/var/lib/postgresql/data"
|
- "pg_data:/var/lib/postgresql/data"
|
||||||
healthcheck:
|
healthcheck:
|
||||||
test:
|
test:
|
||||||
- CMD-SHELL
|
- CMD-SHELL
|
||||||
@@ -169,7 +166,7 @@ services:
|
|||||||
image: redis:7-alpine
|
image: redis:7-alpine
|
||||||
command: redis-server --appendonly yes
|
command: redis-server --appendonly yes
|
||||||
volumes:
|
volumes:
|
||||||
- redis-data:/data
|
- redis_data:/data
|
||||||
healthcheck:
|
healthcheck:
|
||||||
test: ["CMD", "redis-cli", "ping"]
|
test: ["CMD", "redis-cli", "ping"]
|
||||||
interval: 5s
|
interval: 5s
|
||||||
|
|||||||
Reference in New Issue
Block a user