---
# Compose definition for tau-rag.
# Two services: minimal and full. Pick whichever matches your runtime budget.
version: "3.9"

services:
  # Minimal build (Dockerfile target "slim"); published on host port 8000.
  tau-rag-slim:
    build:
      context: .
      target: slim
    image: tau-rag:slim
    ports:
      - "8000:8000"
    restart: unless-stopped
    volumes:
      # for signals.jsonl, snapshots, dashboards
      - ./runtime:/app/runtime
    environment:
      - TAU_RAG_PRESET=no_llm

  # Full build (Dockerfile target "full"); published on host port 8001 so it
  # does not collide with the slim service's host port.
  tau-rag-full:
    build:
      context: .
      target: full
    image: tau-rag:full
    ports:
      - "8001:8000"
    restart: unless-stopped
    volumes:
      - ./runtime:/app/runtime
      # cache AlephBERT between restarts
      - hf-cache:/root/.cache/huggingface
    environment:
      - TAU_RAG_PRESET=hebrew_dense
      # Same path as the hf-cache mount above.
      - HF_HOME=/root/.cache/huggingface

volumes:
  # Named volume mounted by tau-rag-full; no driver options are set.
  hf-cache: {}