Wolf369 committed on
Commit
ab9cab0
·
1 Parent(s): 2a9f20b
Files changed (1) hide show
  1. main.py +1 -1
main.py CHANGED
@@ -13,7 +13,7 @@ app = FastAPI()
13
  @app.get("/llm_inference")
14
  def read_root(
15
  prompt: str,
16
- model: str = "meta-llama/Llama-2-7b-hf",
17
  temperature: float = 0.,
18
  max_tokens: int = 1024) -> List:
19
  sampling_params = SamplingParams(temperature=temperature, max_tokens=max_tokens)
 
13
  @app.get("/llm_inference")
14
  def read_root(
15
  prompt: str,
16
+ model: str = "meta-llama/Llama-2-7b-chat-hf",
17
  temperature: float = 0.,
18
  max_tokens: int = 1024) -> List:
19
  sampling_params = SamplingParams(temperature=temperature, max_tokens=max_tokens)