diff --git a/swarms/server/dockerRunVllm.sh b/swarms/server/dockerRunVllm.sh
new file mode 100644
index 00000000..ace21b2a
--- /dev/null
+++ b/swarms/server/dockerRunVllm.sh
@@ -0,0 +1,24 @@
+#!/usr/bin/env bash
+#
+# Start the vllm/vllm-openai:latest image in a Docker container named vllm,
+# passing it the model NousResearch/Meta-Llama-3-8B-Instruct, with all GPUs.
+#
+# Required environment:
+#   HUGGING_FACE_HUB_TOKEN  Hugging Face access token, forwarded to the container.
+#
+# The token is read from the caller environment and is never stored in this
+# file. The token that was previously hardcoded here must be treated as
+# leaked and revoked.
+set -euo pipefail
+
+: "${HUGGING_FACE_HUB_TOKEN:?export HUGGING_FACE_HUB_TOKEN before running this script}"
+
+# Host networking is used, so the former -p 8000:8000 mapping is dropped:
+# Docker discards published ports in host network mode.
+docker run --runtime nvidia --gpus all \
+  -v "${HOME}/.cache/huggingface:/root/.cache/huggingface" \
+  --env HUGGING_FACE_HUB_TOKEN \
+  --network=host \
+  --name vllm \
+  vllm/vllm-openai:latest \
+  --model NousResearch/Meta-Llama-3-8B-Instruct