- Add `ai` compose profile — Ollama + LiteLLM containers for local dev
when the Agap shared services are unavailable; set the LITELLM_URL /
OLLAMA_URL env vars so that ml-serving points at localhost
- Mark #90 done (LLM schema validation + fallback shipped in 85a332b)
- Mark #80 superseded by ADR-0013 (multi-agent orchestrator is the pipeline)
Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
@@ -82,6 +82,46 @@ services:
|
||||
timeout: 5s
|
||||
retries: 5
|
||||
|
||||
# ── ai profile — Ollama + LiteLLM for local dev ──────────────────────────
|
||||
# Start: docker compose --profile ai up
|
||||
# Use when the Agap shared Ollama/LiteLLM services are not available locally.
|
||||
# Set LITELLM_URL=http://localhost:4000 and OLLAMA_URL=http://localhost:11434
|
||||
# in .env.local to point ml-serving at these containers instead of Agap.
|
||||
|
||||
ollama:
  # Local Ollama server, started only with `--profile ai`.
  # NOTE(review): nothing in this service pulls models; presumably they
  # must be fetched once (e.g. `ollama pull`) before use — confirm.
  image: ollama/ollama:latest
  profiles: [ai]
  volumes:
    # Named volume mounted at /root/.ollama so its contents survive
    # container re-creation.
    - ollama-models:/root/.ollama
  ports:
    # Published on the loopback interface only.
    - "127.0.0.1:11434:11434"
  healthcheck:
    # The ollama/ollama image does not ship curl, so a curl-based probe
    # can never pass and services waiting on `service_healthy` would
    # never start. `ollama list` talks to the local server and exits
    # non-zero when it is unreachable.
    test: ["CMD", "ollama", "list"]
    interval: 15s
    timeout: 5s
    retries: 10
|
||||
|
||||
litellm:
  # LiteLLM proxy in front of the `ollama` service, started only with
  # `--profile ai`.
  image: ghcr.io/berriai/litellm:main-latest
  profiles: [ai]
  environment:
    # Falls back to a fixed dev-only key when LITELLM_MASTER_KEY is unset.
    LITELLM_MASTER_KEY: ${LITELLM_MASTER_KEY:-sk-local-dev}
  # NOTE(review): `--model` is passed twice. Verify that the LiteLLM CLI
  # registers both models rather than keeping only the last one; if it
  # does not, a mounted config file with a `model_list` is needed.
  command: >-
    --model ollama/qwen2.5:1.5b
    --model ollama/nomic-embed-text
    --api_base http://ollama:11434
    --port 4000
  ports:
    # Published on the loopback interface only.
    - "127.0.0.1:4000:4000"
  depends_on:
    # Wait until the ollama healthcheck passes before starting the proxy.
    ollama:
      condition: service_healthy
  healthcheck:
    # `/health` requires the master key once LITELLM_MASTER_KEY is set,
    # so an unauthenticated probe against it fails. `/health/liveliness`
    # is the unauthenticated liveness endpoint. Probe it with the image's
    # own Python instead of relying on curl being installed; urlopen
    # raises (non-zero exit) on connection errors and HTTP 4xx/5xx.
    test:
      - CMD
      - python3
      - "-c"
      - "import urllib.request; urllib.request.urlopen('http://localhost:4000/health/liveliness', timeout=4)"
    interval: 10s
    timeout: 5s
    retries: 5
|
||||
|
||||
# ── mlops profile — MLflow ────────────────────────────────────────────────
|
||||
# Start: docker compose --profile mlops up
|
||||
# MLflow UI: http://localhost:5000 or https://o.alogins.net/mlflow
|
||||
@@ -129,3 +169,6 @@ services:
|
||||
interval: 10s
|
||||
timeout: 5s
|
||||
retries: 5
|
||||
|
||||
volumes:
  # Named volume mounted at /root/.ollama by the ollama service.
  # An explicit empty mapping means "default driver, no options".
  ollama-models: {}
|
||||
|
||||
Reference in New Issue
Block a user