Stanley Xu committed
Commit 2ae3a0e · 1 Parent(s): 3cc40a3

add a simple vllm api application

Files changed (3):
  1. README.md +15 -13
  2. app.py +27 -0
  3. requirements.txt +63 -0
README.md CHANGED
@@ -1,13 +1,15 @@
- ---
- title: Vllm Test
- emoji:
- colorFrom: yellow
- colorTo: red
- sdk: gradio
- sdk_version: 3.44.4
- app_file: app.py
- pinned: false
- license: mit
- ---
-
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+ # vllm-test
+
+ conda create -n vllm_test python=3.11
+ conda activate vllm_test
+ pip install -r requirements.txt
+
+ ## environment settings
+
+ Please set the following environment variables first
+
+ ```
+ export SHOPPAL_VLLM_API_URL=
+ export SHOPPAL_VLLM_MODEL_NAME=
+ export SHOPPAL_VLLM_API_KEY=
+ ```
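As a quick sanity check before launching the app, a minimal sketch (not part of this commit) that reuses these variables to query the vLLM OpenAI-compatible endpoint with the same openai==0.28 client pinned in requirements.txt:

```
import os
import openai

# Point the openai client at the vLLM OpenAI-compatible server configured above.
openai.api_key = os.environ["SHOPPAL_VLLM_API_KEY"]
openai.api_base = os.environ["SHOPPAL_VLLM_API_URL"]

# One short completion to confirm the URL, key, and model name are all valid.
resp = openai.ChatCompletion.create(
    model=os.environ["SHOPPAL_VLLM_MODEL_NAME"],
    messages=[{"role": "user", "content": "Say hello in one sentence."}],
    max_tokens=32,
)
print(resp.choices[0].message.content)
```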
app.py ADDED
@@ -0,0 +1,27 @@
+ import openai
+ import gradio as gr
+ import os
+
+ # Point the OpenAI client (openai==0.28 style) at the vLLM OpenAI-compatible server.
+ openai.api_key = os.environ["SHOPPAL_VLLM_API_KEY"]
+ openai.api_base = os.environ["SHOPPAL_VLLM_API_URL"]
+
+ model_name = os.environ["SHOPPAL_VLLM_MODEL_NAME"]
+
+ def predict(message, history):
+     # Convert Gradio's (user, assistant) history tuples into OpenAI chat messages.
+     history_openai_format = []
+     for human, assistant in history:
+         history_openai_format.append({"role": "user", "content": human})
+         history_openai_format.append({"role": "assistant", "content": assistant})
+     history_openai_format.append({"role": "user", "content": message})
+
+     response = openai.ChatCompletion.create(
+         model=model_name,
+         messages=history_openai_format,
+         stop=[" Human:", " Assistant:"],
+         temperature=0.5,
+         max_tokens=2048,
+     )
+     return response.choices[0].message.content
+
+
+ gr.ChatInterface(predict).queue().launch()
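For reference, the loop in predict flattens the chat history into the message list sent to the server; a runnable illustration with made-up turns (not part of this commit):

```
# Illustrative turns only; predict() performs the same conversion on live chat history.
history = [("Hi", "Hello! How can I help?")]
message = "What does this Space do?"

messages = []
for human, assistant in history:
    messages.append({"role": "user", "content": human})
    messages.append({"role": "assistant", "content": assistant})
messages.append({"role": "user", "content": message})

print(messages)
# [{'role': 'user', 'content': 'Hi'},
#  {'role': 'assistant', 'content': 'Hello! How can I help?'},
#  {'role': 'user', 'content': 'What does this Space do?'}]
```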
requirements.txt ADDED
@@ -0,0 +1,63 @@
+ aiofiles==23.2.1
+ aiohttp==3.8.5
+ aiosignal==1.3.1
+ altair==5.1.1
+ annotated-types==0.5.0
+ anyio==3.7.1
+ async-timeout==4.0.3
+ attrs==23.1.0
+ certifi==2023.7.22
+ charset-normalizer==3.2.0
+ click==8.1.7
+ contourpy==1.1.1
+ cycler==0.11.0
+ fastapi==0.103.1
+ ffmpy==0.3.1
+ filelock==3.12.4
+ fonttools==4.42.1
+ frozenlist==1.4.0
+ fsspec==2023.9.2
+ gradio==3.44.4
+ gradio_client==0.5.1
+ h11==0.14.0
+ httpcore==0.18.0
+ httpx==0.25.0
+ huggingface-hub==0.17.2
+ idna==3.4
+ importlib-resources==6.1.0
+ Jinja2==3.1.2
+ jsonschema==4.19.1
+ jsonschema-specifications==2023.7.1
+ kiwisolver==1.4.5
+ MarkupSafe==2.1.3
+ matplotlib==3.8.0
+ multidict==6.0.4
+ numpy==1.26.0
+ openai==0.28.0
+ orjson==3.9.7
+ packaging==23.1
+ pandas==2.1.1
+ Pillow==10.0.1
+ pydantic==2.3.0
+ pydantic_core==2.6.3
+ pydub==0.25.1
+ pyparsing==3.1.1
+ python-dateutil==2.8.2
+ python-multipart==0.0.6
+ pytz==2023.3.post1
+ PyYAML==6.0.1
+ referencing==0.30.2
+ requests==2.31.0
+ rpds-py==0.10.3
+ semantic-version==2.10.0
+ six==1.16.0
+ sniffio==1.3.0
+ starlette==0.27.0
+ toolz==0.12.0
+ tqdm==4.66.1
+ typing_extensions==4.8.0
+ tzdata==2023.3
+ urllib3==2.0.5
+ uvicorn==0.23.2
+ websockets==11.0.3
+ yarl==1.9.2