# Docker Compose definition for the `rezero` service: builds the image from
# the local Dockerfile, runs app.py, and publishes the Gradio web interface
# on port 7860 with the NVIDIA container runtime.
version: '3.8'

services:
  rezero:
    build:
      context: .
      dockerfile: Dockerfile
    image: rezero
    container_name: rezero

    volumes:
      # Bind-mount the project directory into the container at /app.
      - .:/app
      # Windows-compatible path for the Hugging Face cache, shared with the
      # host so cached files survive container re-creation.
      # NOTE(review): USERPROFILE is a Windows variable; on Linux/macOS hosts
      # it is normally unset, so this path would need ${HOME} instead.
      - ${USERPROFILE}/.cache/huggingface:/root/.cache/huggingface

    ports:
      # Gradio web interface (host:container). Kept quoted so the mapping is
      # always read as a string.
      - "7860:7860"

    # Additional variables are loaded from the .env file next to this file.
    env_file:
      - .env

    # Windows with Docker Desktop + WSL2 uses this format
    environment:
      # Expose every GPU to the container.
      - NVIDIA_VISIBLE_DEVICES=all
      # Listen on all interfaces so the published port is reachable from the
      # host; the port matches the mapping under `ports`.
      - GRADIO_SERVER_NAME=0.0.0.0
      - GRADIO_SERVER_PORT=7860
      - GRADIO_SHARE=False
      # NOTE(review): looks like a Hugging Face Hub repo id rather than a
      # local directory - confirm against how app.py consumes it.
      - GENERATOR_MODEL_DIR=Menlo/ReZero-v0.1-llama-3.2-3b-it-grpo-250404

    # Use runtime instead of deploy for Windows Docker Desktop
    runtime: nvidia

    # Create the model directory, then run the app. The folded scalar (`>`)
    # joins the lines below into one command string.
    command: >
      bash -c "mkdir -p /app/models/generator && python app.py"

    restart: unless-stopped

    # Size of /dev/shm inside the container.
    shm_size: 8gb

    # Probe the Gradio endpoint from inside the container.
    # NOTE(review): requires `curl` to be present in the image - confirm the
    # Dockerfile installs it.
    healthcheck:
      test: ["CMD", "curl", "-f", "http://localhost:7860/"]
      interval: 30s
      timeout: 10s
      retries: 3
      start_period: 40s