itlevy esegal committed on
Commit
9c0e074
·
1 Parent(s): 2cb5290

Fix vLLM command (#10)

Browse files

- Fix vLLM command (03c1f724c639a7c9d8904cf26be3efd6a9c44b00)


Co-authored-by: Elad Segal <esegal@users.noreply.huggingface.co>

Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -267,7 +267,7 @@ docker run --gpus all -p 8000:8000 \
267
  vllm/vllm-openai:v0.17.1 \
268
  -c "
269
  apt-get update && apt-get install -y git &&
270
- VLLM_PRECOMPILED_WHEEL_LOCATION=https://wheels.vllm.ai/1ac2ef2e5335ca0af99aee438998c9305461f563/vllm-0.18.1rc1.dev127%2Bg1ac2ef2e5-cp38-abi3-manylinux_2_31_$(uname -m).whl VLLM_USE_PRECOMPILED=1 pip install --no-build-isolation 'git+https://github.com/vllm-project/vllm.git@refs/pull/38135/head' &&
271
  pip install flashinfer-cubin==0.6.6 flashinfer-jit-cache==0.6.6 --extra-index-url https://flashinfer.ai/whl/cu129 &&
272
  export PYTORCH_ALLOC_CONF=expandable_segments:True &&
273
  vllm serve nvidia/gpt-oss-puzzle-88B \
 
267
  vllm/vllm-openai:v0.17.1 \
268
  -c "
269
  apt-get update && apt-get install -y git &&
270
+ VLLM_PRECOMPILED_WHEEL_LOCATION=https://wheels.vllm.ai/1ac2ef2e5335ca0af99aee438998c9305461f563/vllm-0.18.1rc1.dev127%2Bg1ac2ef2e5-cp38-abi3-manylinux_2_31_$(uname -m).whl VLLM_USE_PRECOMPILED=1 pip install --no-build-isolation 'git+https://github.com/vllm-project/vllm.git@88f6aaad7cc2fe8904d5fcf31d06eb57f15a6d25' &&
271
  pip install flashinfer-cubin==0.6.6 flashinfer-jit-cache==0.6.6 --extra-index-url https://flashinfer.ai/whl/cu129 &&
272
  export PYTORCH_ALLOC_CONF=expandable_segments:True &&
273
  vllm serve nvidia/gpt-oss-puzzle-88B \