Spaces:
Running
on
A100
Running
on
A100
cupy
Browse files - Dockerfile +2 -3
Dockerfile
CHANGED
@@ -34,7 +34,6 @@ RUN uv pip install vllm==0.7.2
|
|
34 |
RUN uv pip install --upgrade git+https://github.com/huggingface/transformers.git@336dc69d63d56f232a183a3e7f52790429b871ef
|
35 |
|
36 |
RUN uv pip install ray[adag]
|
|
|
37 |
|
38 |
-
|
39 |
-
|
40 |
-
ENTRYPOINT ["/bin/bash", "-c", ". .venv/bin/activate && python -m vllm.entrypoints.openai.api_server --model convergence-ai/proxy-lite --trust-remote-code --tokenizer-pool-size 20 --limit-mm-per-prompt image=1 --enable-auto-tool-choice --tool-call-parser hermes --port 7860"]
|
|
|
34 |
RUN uv pip install --upgrade git+https://github.com/huggingface/transformers.git@336dc69d63d56f232a183a3e7f52790429b871ef
|
35 |
|
36 |
RUN uv pip install ray[adag]
|
37 |
+
# Install the prebuilt CUDA 12 CuPy wheel rather than the bare `cupy` sdist, which
# compiles from source at build time and must not coexist with a cupy-cudaXX wheel.
# NOTE(review): assumes the image's CUDA major version is 12 — confirm against the base image.
RUN uv pip install cupy-cuda12x
|
38 |
|
39 |
+
# Activate the virtualenv, enable VLLM_USE_V1, then `exec` the OpenAI-compatible vLLM
# server so it replaces the bash wrapper as PID 1 and receives stop signals directly.
ENTRYPOINT ["/bin/bash", "-c", ". .venv/bin/activate && export VLLM_USE_V1=1 && exec python -m vllm.entrypoints.openai.api_server --model convergence-ai/proxy-lite --trust-remote-code --tokenizer-pool-size 20 --limit-mm-per-prompt image=1 --enable-auto-tool-choice --tool-call-parser hermes --port 7860"]
|
|
|
|