Wolf369 committed on
Commit
a2415d5
·
1 Parent(s): 29efd95

Update prompt

Browse files
Files changed (1) hide show
  1. main.py +2 -2
main.py CHANGED
@@ -7,7 +7,7 @@ app = FastAPI()
7
 
8
  @app.get("/llm_inference")
9
  def read_root(
10
- prompts: List[str],
11
  model: str = "meta-llama/Llama-2-7b-hf",
12
  temperature: float = 0.,
13
  max_tokens: int = 1024) -> List:
@@ -15,6 +15,6 @@ def read_root(
15
 
16
  llm = LLM(model=model)
17
 
18
- response = llm.generate(prompts, sampling_params)
19
 
20
  return response
 
7
 
8
  @app.get("/llm_inference")
9
  def read_root(
10
+ prompt: str,
11
  model: str = "meta-llama/Llama-2-7b-hf",
12
  temperature: float = 0.,
13
  max_tokens: int = 1024) -> List:
 
15
 
16
  llm = LLM(model=model)
17
 
18
+ response = llm.generate([prompt], sampling_params)
19
 
20
  return response