Spaces:
Runtime error
Runtime error
debug
Browse files
main.py
CHANGED
@@ -13,7 +13,7 @@ app = FastAPI()
 @app.get("/llm_inference")
 def read_root(
     prompt: str,
-    model: str = "meta-llama/Llama-2-7b-hf",
+    model: str = "meta-llama/Llama-2-7b-chat-hf",
     temperature: float = 0.,
     max_tokens: int = 1024) -> List:
     sampling_params = SamplingParams(temperature=temperature, max_tokens=max_tokens)