Spaces:
Runtime error
Update prompt
Browse files
main.py
CHANGED
@@ -7,7 +7,7 @@ app = FastAPI()
|
|
7 |
|
8 |
@app.get("/llm_inference")
|
9 |
def read_root(
|
10 |
-
|
11 |
model: str = "meta-llama/Llama-2-7b-hf",
|
12 |
temperature: float = 0.,
|
13 |
max_tokens: int = 1024) -> List:
|
@@ -15,6 +15,6 @@ def read_root(
|
|
15 |
|
16 |
llm = LLM(model=model)
|
17 |
|
18 |
-
response = llm.generate(
|
19 |
|
20 |
return response
|
|
|
7 |
|
8 |
@app.get("/llm_inference")
|
9 |
def read_root(
|
10 |
+
prompt: str,
|
11 |
model: str = "meta-llama/Llama-2-7b-hf",
|
12 |
temperature: float = 0.,
|
13 |
max_tokens: int = 1024) -> List:
|
|
|
15 |
|
16 |
llm = LLM(model=model)
|
17 |
|
18 |
+
response = llm.generate([prompt], sampling_params)
|
19 |
|
20 |
return response
|