forked from LaansDole/stt-to-medical
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy path: docker-compose.gpu.yaml
More file actions
185 lines (178 loc) · 5.32 KB
/
docker-compose.gpu.yaml
File metadata and controls
185 lines (178 loc) · 5.32 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
---
# GPU-enabled Compose stack: Temporal (+ Postgres backing store), the WhisperX
# FastAPI service, a Temporal worker, and a Streamlit UI. GPU access is granted
# via `deploy.resources.reservations.devices` (requires the NVIDIA container
# toolkit on the host).
#
# NOTE: the obsolete top-level `version` key has been removed — the Compose
# Specification ignores it and `docker compose` warns when it is present.
services:
  # Temporal server. The auto-setup image provisions the schemas in Postgres
  # on first start, so it must wait for Postgres to be genuinely ready.
  temporal:
    image: temporalio/auto-setup:latest
    ports:
      - "7233:7233"
    environment:
      - DB=postgres12
      - DB_PORT=5432
      - POSTGRES_USER=temporal
      - POSTGRES_PWD=temporal
      - POSTGRES_SEEDS=postgres
      - DBNAME=temporal
      - VISIBILITY_DBNAME=temporal_visibility
      # Workflow retention: 7 days (168 hours)
      - DEFAULT_NAMESPACE_RETENTION=168h
    depends_on:
      # Wait for the Postgres healthcheck (pg_isready) rather than mere
      # container start, so auto-setup does not race schema creation.
      postgres:
        condition: service_healthy
    networks:
      - whisperx-network
    healthcheck:
      test: ["CMD", "tctl", "--address", "temporal:7233", "cluster", "health"]
      interval: 30s
      timeout: 10s
      retries: 5
      start_period: 90s

  # Postgres backing store for Temporal (internal only — no published ports).
  postgres:
    image: postgres:13
    environment:
      - POSTGRES_PASSWORD=temporal
      - POSTGRES_USER=temporal
      - POSTGRES_DB=temporal
    volumes:
      - postgres-data:/var/lib/postgresql/data
    networks:
      - whisperx-network
    healthcheck:
      test: ["CMD-SHELL", "pg_isready -U temporal"]
      interval: 10s
      timeout: 5s
      retries: 5

  # WhisperX FastAPI Application with GPU
  whisperx-api:
    build:
      context: .
      dockerfile: Dockerfile
      args:
        - INSTALL_GPU=true
    ports:
      - "8000:8000"
    environment:
      # Secrets from .env
      - HF_TOKEN=${HF_TOKEN:-}
      - ENVIRONMENT=${ENVIRONMENT:-production}
      - LOG_LEVEL=${LOG_LEVEL:-INFO}
      - DIARIZATION_MODEL_PATH=${DIARIZATION_MODEL_PATH:-}
      - TEMPORAL_SERVER_URL=temporal:7233
      - HIPAA_ENCRYPTION_KEY=${HIPAA_ENCRYPTION_KEY:-default}
      # LM Studio configuration for medical processing (host.docker.internal for Docker-to-host connectivity)
      - LM_STUDIO_BASE_URL=${LM_STUDIO_BASE_URL:-http://host.docker.internal:1234/v1}
      - LM_STUDIO_MODEL=${LM_STUDIO_MODEL:-}
      - LM_STUDIO_MAX_TOKENS=${LM_STUDIO_MAX_TOKENS:-8192}
      - EMBEDDING_MODEL=${EMBEDDING_MODEL:-text-embedding-bge-reranker-v2-m3}
      - EMBEDDING_DIMENSION=${EMBEDDING_DIMENSION:-1024}
    volumes:
      # Config file (runtime defaults)
      - ./config.yaml:/app/config.yaml:ro
      # Model cache
      - whisperx-huggingface-cache:/root/.cache/huggingface
      - whisperx-torch-cache:/root/.cache/torch
      # Shared file uploads (Docker volume, not host directory)
      - whisperx-uploads:/tmp/uploads
      # Data persistence
      - ./vector_storage:/app/vector_storage
      - ./data:/app/data
      - ./audit_logs:/app/audit_logs
    depends_on:
      temporal:
        condition: service_healthy
    networks:
      - whisperx-network
    extra_hosts:
      - "host.docker.internal:host-gateway"
    restart: unless-stopped
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: 1
              capabilities: [gpu]
    healthcheck:
      test: ["CMD", "curl", "-f", "http://localhost:8000/health"]
      interval: 30s
      timeout: 10s
      retries: 3
      start_period: 60s

  # Temporal Worker with GPU
  whisperx-worker:
    build:
      context: .
      dockerfile: Dockerfile
      args:
        - INSTALL_GPU=true
    # Give in-flight activities time to finish before SIGKILL.
    stop_grace_period: 30s
    environment:
      # Secrets from .env
      - HF_TOKEN=${HF_TOKEN:-}
      - ENVIRONMENT=${ENVIRONMENT:-production}
      - LOG_LEVEL=${LOG_LEVEL:-INFO}
      - DIARIZATION_MODEL_PATH=${DIARIZATION_MODEL_PATH:-}
      - TEMPORAL_SERVER_URL=temporal:7233
      - HIPAA_ENCRYPTION_KEY=${HIPAA_ENCRYPTION_KEY:-default}
      # LM Studio configuration for medical processing (host.docker.internal for Docker-to-host connectivity)
      - LM_STUDIO_BASE_URL=${LM_STUDIO_BASE_URL:-http://host.docker.internal:1234/v1}
      - LM_STUDIO_MODEL=${LM_STUDIO_MODEL:-}
      - LM_STUDIO_MAX_TOKENS=${LM_STUDIO_MAX_TOKENS:-8192}
      - EMBEDDING_MODEL=${EMBEDDING_MODEL:-text-embedding-bge-reranker-v2-m3}
      - EMBEDDING_DIMENSION=${EMBEDDING_DIMENSION:-1024}
    volumes:
      # Config file (runtime defaults)
      - ./config.yaml:/app/config.yaml:ro
      # Model cache
      - whisperx-huggingface-cache:/root/.cache/huggingface
      - whisperx-torch-cache:/root/.cache/torch
      # File processing (Docker volume)
      - whisperx-uploads:/tmp/uploads
      # Data persistence
      - ./vector_storage:/app/vector_storage
      - ./data:/app/data
      - ./audit_logs:/app/audit_logs
    command: ["uv", "run", "python", "-m", "app.temporal.worker"]
    depends_on:
      temporal:
        condition: service_healthy
    networks:
      - whisperx-network
    extra_hosts:
      - "host.docker.internal:host-gateway"
    restart: unless-stopped
    deploy:
      replicas: 1
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: 1
              capabilities: [gpu]

  # Streamlit front-end; talks to the API over the internal network.
  streamlit-ui:
    build:
      context: .
      dockerfile: Dockerfile.streamlit
    ports:
      - "8501:8501"
    environment:
      - WHISPERX_API_URL=http://whisperx-api:8000
    volumes:
      - ./streamlit_app:/app/streamlit_app
    depends_on:
      whisperx-api:
        condition: service_healthy
    networks:
      - whisperx-network
    restart: unless-stopped
    healthcheck:
      test: ["CMD", "curl", "-f", "http://localhost:8501/_stcore/health"]
      interval: 30s
      timeout: 10s
      retries: 3
      start_period: 30s

networks:
  whisperx-network:
    driver: bridge

volumes:
  postgres-data:
  whisperx-huggingface-cache:
  whisperx-torch-cache:
  whisperx-uploads: