Added LiteLLM as an OpenAI-compatible proxy for Anthropic's API to enable Claude models in Open WebUI.

**New Service: litellm**
- Image: ghcr.io/berriai/litellm:main-latest
- Internal proxy on port 4000
- Exposes Anthropic's API in an OpenAI-compatible format
- Health check with 30s intervals
- Not exposed via Traefik (internal only)

**LiteLLM Configuration (litellm-config.yaml)**
- Claude Sonnet 4 (claude-sonnet-4-20250514)
- Claude Sonnet 4.5 (claude-sonnet-4-5-20250929)
- Claude 3.5 Sonnet (claude-3-5-sonnet-20241022)
- Claude 3 Opus (claude-3-opus-20240229)
- Claude 3 Haiku (claude-3-haiku-20240307)

**Open WebUI Configuration Updates**
- Changed OPENAI_API_BASE_URLS to point to the LiteLLM proxy
- URL: http://litellm:4000/v1
- Added litellm as a dependency of the webui service
- Dummy API key for proxy authentication

**Why LiteLLM?**
Anthropic's API uses a different endpoint structure and different authentication headers than OpenAI's. LiteLLM acts as a translation layer, allowing Open WebUI to use Claude models through its OpenAI-compatible interface.

**Available Models in Open WebUI**
- claude-sonnet-4 (latest Claude Sonnet 4)
- claude-sonnet-4.5 (Claude Sonnet 4.5)
- claude-3-5-sonnet
- claude-3-opus
- claude-3-haiku

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
147 lines
5.3 KiB
YAML
147 lines
5.3 KiB
YAML
services:
  # PostgreSQL with pgvector for AI/RAG workloads.
  # Reachable by other services on compose_network as ai_postgres:5432;
  # no host ports are published.
  ai_postgres:
    image: ${AI_POSTGRES_IMAGE:-pgvector/pgvector:pg16}
    container_name: ${AI_COMPOSE_PROJECT_NAME}_postgres
    restart: unless-stopped
    environment:
      TZ: ${TIMEZONE:-Europe/Berlin}
      POSTGRES_USER: ${AI_DB_USER}
      POSTGRES_PASSWORD: ${AI_DB_PASSWORD}
      POSTGRES_DB: ${AI_DB_NAME}
      # Both settings select scram-sha-256 for host (TCP) connections:
      # one is read by the image entrypoint, the other is passed to initdb.
      POSTGRES_HOST_AUTH_METHOD: scram-sha-256
      POSTGRES_INITDB_ARGS: --auth-host=scram-sha-256
    volumes:
      - ai_postgres_data:/var/lib/postgresql/data
    healthcheck:
      # -d is given explicitly: without it pg_isready targets a database
      # named after the user, and the server logs
      # 'FATAL: database "<user>" does not exist' on every probe whenever
      # AI_DB_NAME differs from AI_DB_USER.
      test: ["CMD-SHELL", "pg_isready -U ${AI_DB_USER} -d ${AI_DB_NAME}"]
      interval: 30s
      timeout: 10s
      retries: 3
      start_period: 40s
    networks:
      - compose_network

# Open WebUI - ChatGPT-like interface for AI models
  webui:
    image: ${AI_WEBUI_IMAGE:-ghcr.io/open-webui/open-webui:main}
    container_name: ${AI_COMPOSE_PROJECT_NAME}_webui
    restart: unless-stopped
    environment:
      TZ: ${TIMEZONE:-Europe/Berlin}

      # Database configuration
      # NOTE(review): credentials are interpolated into a URL as-is; a
      # password containing characters such as '@', ':' or '/' would need
      # to be URL-encoded in the .env file - confirm.
      DATABASE_URL: postgresql://${AI_DB_USER}:${AI_DB_PASSWORD}@ai_postgres:5432/${AI_DB_NAME}

      # OpenAI API configuration (pointing to LiteLLM proxy)
      OPENAI_API_BASE_URLS: http://litellm:4000/v1
      # Must equal the proxy's LITELLM_MASTER_KEY, which the litellm service
      # in this file sets from AI_WEBUI_SECRET_KEY. A placeholder such as
      # sk-1234 is rejected with 401 once a master key is configured.
      OPENAI_API_KEYS: ${AI_WEBUI_SECRET_KEY}

      # WebUI configuration
      WEBUI_NAME: ${AI_WEBUI_NAME:-Pivoine AI}
      WEBUI_URL: https://${AI_TRAEFIK_HOST}
      WEBUI_SECRET_KEY: ${AI_WEBUI_SECRET_KEY}

      # Feature flags
      ENABLE_SIGNUP: ${AI_ENABLE_SIGNUP:-true}
      ENABLE_RAG_WEB_SEARCH: ${AI_ENABLE_RAG_WEB_SEARCH:-true}
      ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION: ${AI_ENABLE_RAG_SSL_VERIFY:-true}

      # RAG configuration
      # NOTE(review): the default embedding engine is "openai" while the
      # only OpenAI-compatible endpoint configured above is the LiteLLM
      # proxy - verify that an embedding model is actually served there.
      RAG_EMBEDDING_ENGINE: ${AI_RAG_EMBEDDING_ENGINE:-openai}
      RAG_EMBEDDING_MODEL: ${AI_RAG_EMBEDDING_MODEL:-text-embedding-3-small}
      VECTOR_DB: ${AI_VECTOR_DB:-pgvector}

      # Email configuration (IONOS SMTP)
      SMTP_HOST: ${EMAIL_SMTP_HOST}
      SMTP_PORT: ${EMAIL_SMTP_PORT}
      SMTP_USER: ${EMAIL_SMTP_USER}
      SMTP_PASSWORD: ${EMAIL_SMTP_PASSWORD}
      SMTP_FROM_EMAIL: ${EMAIL_FROM}
      # Quoted so YAML keeps them as strings: bare booleans in an
      # environment mapping are rejected or re-cased by some Compose
      # implementations.
      SMTP_USE_TLS: 'false'
      SMTP_USE_SSL: 'true'

    volumes:
      - ai_webui_data:/app/backend/data
    depends_on:
      # Wait until Postgres passes its healthcheck so the first start does
      # not race the database initialisation.
      ai_postgres:
        condition: service_healthy
      # Only start ordering is required for the proxy.
      litellm:
        condition: service_started
    networks:
      - compose_network
    labels:
      - 'traefik.enable=${AI_TRAEFIK_ENABLED}'
      # HTTP to HTTPS redirect
      - 'traefik.http.middlewares.${AI_COMPOSE_PROJECT_NAME}-redirect-web-secure.redirectscheme.scheme=https'
      - 'traefik.http.routers.${AI_COMPOSE_PROJECT_NAME}-web.middlewares=${AI_COMPOSE_PROJECT_NAME}-redirect-web-secure'
      - 'traefik.http.routers.${AI_COMPOSE_PROJECT_NAME}-web.rule=Host(`${AI_TRAEFIK_HOST}`)'
      - 'traefik.http.routers.${AI_COMPOSE_PROJECT_NAME}-web.entrypoints=web'
      # HTTPS router
      - 'traefik.http.routers.${AI_COMPOSE_PROJECT_NAME}-web-secure.rule=Host(`${AI_TRAEFIK_HOST}`)'
      - 'traefik.http.routers.${AI_COMPOSE_PROJECT_NAME}-web-secure.tls.certresolver=resolver'
      - 'traefik.http.routers.${AI_COMPOSE_PROJECT_NAME}-web-secure.entrypoints=web-secure'
      - 'traefik.http.middlewares.${AI_COMPOSE_PROJECT_NAME}-web-secure-compress.compress=true'
      - 'traefik.http.routers.${AI_COMPOSE_PROJECT_NAME}-web-secure.middlewares=${AI_COMPOSE_PROJECT_NAME}-web-secure-compress,security-headers@file'
      # Service (port Traefik forwards to inside the container)
      - 'traefik.http.services.${AI_COMPOSE_PROJECT_NAME}-web-secure.loadbalancer.server.port=8080'
      - 'traefik.docker.network=${NETWORK_NAME}'
      # Watchtower
      - 'com.centurylinklabs.watchtower.enable=${WATCHTOWER_LABEL_ENABLE}'

# LiteLLM - Proxy to convert Anthropic API to OpenAI-compatible format
  litellm:
    # Overridable like the other service images; the default is unchanged.
    image: ${AI_LITELLM_IMAGE:-ghcr.io/berriai/litellm:main-latest}
    container_name: ${AI_COMPOSE_PROJECT_NAME}_litellm
    restart: unless-stopped
    environment:
      TZ: ${TIMEZONE:-Europe/Berlin}
      ANTHROPIC_API_KEY: ${ANTHROPIC_API_KEY}
      # Clients must present this value as their API key.
      # NOTE(review): this reuses the WebUI session secret; a dedicated
      # variable would be cleaner. LiteLLM's docs also state that the
      # master key should start with "sk-" - confirm the value complies.
      LITELLM_MASTER_KEY: ${AI_WEBUI_SECRET_KEY}
    volumes:
      - ./ai/litellm-config.yaml:/app/config.yaml:ro
    command: ["--config", "/app/config.yaml", "--port", "4000", "--num_workers", "1"]
    networks:
      - compose_network
    healthcheck:
      # Probe /health/liveliness rather than /health: with a master key set
      # /health requires authentication (an unauthenticated probe gets 401)
      # and it issues real requests to every configured model.
      # python3 is used because the image is not guaranteed to ship curl;
      # urlopen raises on HTTP error statuses, giving a non-zero exit code.
      test:
        - CMD-SHELL
        - >-
          python3 -c "import urllib.request;
          urllib.request.urlopen('http://localhost:4000/health/liveliness', timeout=5)"
      interval: 30s
      timeout: 10s
      retries: 3
      start_period: 20s
    labels:
      # No Traefik exposure - internal only
      - 'traefik.enable=false'
      # Watchtower
      - 'com.centurylinklabs.watchtower.enable=${WATCHTOWER_LABEL_ENABLE}'

# Crawl4AI - web scraping backend for LLM workflows (internal API only)
  crawl4ai:
    image: "${AI_CRAWL4AI_IMAGE:-unclecode/crawl4ai:latest}"
    container_name: "${AI_COMPOSE_PROJECT_NAME}_crawl4ai"
    restart: unless-stopped
    environment:
      TZ: "${TIMEZONE:-Europe/Berlin}"
      # Passed to the container as PORT; defaults to 11235
      PORT: "${AI_CRAWL4AI_PORT:-11235}"
    volumes:
      # Named volume mounted at /app/.crawl4ai
      - "ai_crawl4ai_data:/app/.crawl4ai"
    networks:
      - compose_network
    labels:
      # Keep this service out of Traefik routing
      - "traefik.enable=false"
      # Opt in/out of Watchtower updates via WATCHTOWER_LABEL_ENABLE
      - "com.centurylinklabs.watchtower.enable=${WATCHTOWER_LABEL_ENABLE}"

# Named volumes; each gets an explicit name derived from
# AI_COMPOSE_PROJECT_NAME.
volumes:
  # Mounted by ai_postgres at /var/lib/postgresql/data
  ai_postgres_data:
    name: "${AI_COMPOSE_PROJECT_NAME}_postgres_data"
  # Mounted by webui at /app/backend/data
  ai_webui_data:
    name: "${AI_COMPOSE_PROJECT_NAME}_webui_data"
  # Mounted by crawl4ai at /app/.crawl4ai
  ai_crawl4ai_data:
    name: "${AI_COMPOSE_PROJECT_NAME}_crawl4ai_data"

# All services attach to one pre-existing network. Because it is declared
# external, Compose will not create it; it must exist before `up`.
networks:
  compose_network:
    name: "${NETWORK_NAME}"
    external: true