parent
3510af1fbd
commit
d57debe0d4
@ -0,0 +1,38 @@
|
||||
# Docker Compose definition for the ReZero Gradio app with NVIDIA GPU access.
# The volume path and GPU settings below target Windows with Docker Desktop + WSL2.
version: '3.8'

services:
  rezero:
    # Build the image from the Dockerfile in this directory and tag it "rezero".
    build:
      context: .
      dockerfile: Dockerfile
    image: rezero
    container_name: rezero
    volumes:
      # Bind-mount the project directory so the container runs the local sources.
      - .:/app
      # Windows-compatible path for the Hugging Face cache on the host.
      # NOTE(review): USERPROFILE is normally only set on Windows; on other
      # hosts it expands to an empty string -- confirm before reusing elsewhere.
      - ${USERPROFILE}/.cache/huggingface:/root/.cache/huggingface
    ports:
      - "7860:7860"  # Gradio web interface
    env_file:
      - .env
    # Windows with Docker Desktop + WSL2 uses this format for GPU selection.
    environment:
      - NVIDIA_VISIBLE_DEVICES=all
      # Listen on all interfaces so the published port is reachable from the host.
      - GRADIO_SERVER_NAME=0.0.0.0
      - GRADIO_SERVER_PORT=7860
      - GRADIO_SHARE=False
      - GENERATOR_MODEL_DIR=Menlo/ReZero-v0.1-llama-3.2-3b-it-grpo-250404
    # Use runtime instead of deploy for Windows Docker Desktop.
    runtime: nvidia
    # Create the model directory, then run the app. Because /app is the
    # bind-mounted project directory, the directory also appears on the host.
    # ">-" folds the two lines into one command without a trailing newline.
    command: >-
      bash -c "mkdir -p /app/models/generator &&
      python app.py"
    restart: unless-stopped
    shm_size: 8gb
    # Probe the Gradio endpoint from inside the container.
    # NOTE(review): this requires curl in the image -- confirm the Dockerfile
    # installs it, otherwise the container will always report unhealthy.
    healthcheck:
      test: ["CMD", "curl", "-f", "http://localhost:7860/"]
      interval: 30s
      timeout: 10s
      retries: 3
      start_period: 40s
|
Loading…
Reference in new issue