chore(m2): close out remaining loose ends (#80, #86, #90)

- Add `ai` compose profile — Ollama + LiteLLM containers for local dev when
  Agap shared services are unavailable; use with LITELLM_URL / OLLAMA_URL
  env vars pointing ml-serving at localhost
- Mark #90 done (LLM schema validation + fallback shipped in 85a332b)
- Mark #80 superseded by ADR-0013 (multi-agent orchestrator is the pipeline)

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-05-12 15:31:25 +00:00
parent 85a332b22b
commit 8fd08379d7
2 changed files with 46 additions and 3 deletions
--- a/infra/docker/docker-compose.yml
+++ b/infra/docker/docker-compose.yml
@@ -82,6 +82,46 @@ services:
      timeout: 5s
      retries: 5

+  # ── ai profile — Ollama + LiteLLM for local dev ──────────────────────────
+  # Start: docker compose --profile ai up
+  # Use when the Agap shared Ollama/LiteLLM services are not available locally.
+  # Set LITELLM_URL=http://localhost:4000 and OLLAMA_URL=http://localhost:11434
+  # in .env.local to point ml-serving at these containers instead of Agap.
+
+  ollama:  # local Ollama model server; only started with `--profile ai`
+    image: ollama/ollama:latest
+    profiles: [ai]
+    volumes:
+      - ollama-models:/root/.ollama  # keep pulled models across container restarts
+    ports:
+      - "127.0.0.1:11434:11434"  # published on loopback only
+    healthcheck:
+      test: ["CMD", "ollama", "list"]  # image ships no curl; the bundled CLI queries the local API instead
+      interval: 15s
+      timeout: 5s
+      retries: 10
+
+  litellm:  # LiteLLM proxy in front of the ollama service; only started with `--profile ai`
+    image: ghcr.io/berriai/litellm:main-latest
+    profiles: [ai]
+    environment:
+      LITELLM_MASTER_KEY: ${LITELLM_MASTER_KEY:-sk-local-dev}  # dev-only fallback key; override via env
+    command: >  # NOTE(review): --model looks single-valued (last wins?) — confirm both models are served, else use a config.yaml model_list
+      --model ollama/qwen2.5:1.5b
+      --model ollama/nomic-embed-text
+      --api_base http://ollama:11434
+      --port 4000
+    ports:
+      - "127.0.0.1:4000:4000"  # published on loopback only
+    depends_on:
+      ollama:
+        condition: service_healthy  # wait until the ollama healthcheck passes
+    healthcheck:
+      test: ["CMD", "python3", "-c", "import urllib.request; urllib.request.urlopen('http://localhost:4000/health/liveliness')"]  # /health needs the master key and calls every model; liveliness is unauthenticated and needs no curl
+      interval: 10s
+      timeout: 5s
+      retries: 5
+
  # ── mlops profile — MLflow ────────────────────────────────────────────────
  # Start: docker compose --profile mlops up
  # MLflow UI:  http://localhost:5000  or  https://o.alogins.net/mlflow
@@ -129,3 +169,6 @@ services:
      interval: 10s
      timeout: 5s
      retries: 5
+
+volumes:
+  ollama-models: {}  # named volume with default settings; mounted by the ollama service at /root/.ollama