Spaces:
Sleeping
Sleeping
File size: 603 Bytes
406e834 2fe6984 c209aa4 406e834 418e6bc 406e834 c209aa4 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 |
from fastapi import FastAPI
from transformers import AutoModelForCausalLM, AutoTokenizer
# Identifier of the pretrained checkpoint; passed to both from_pretrained
# calls below so the tokenizer and model come from the same source.
model_name = "mynuddin/chatbot"

# Load the tokenizer and model once, at import time, as module-level objects.
# No cache_dir argument is passed, so the library's default cache is used.
tokenizer = AutoTokenizer.from_pretrained(model_name)
# .to("cpu") explicitly places the loaded model on the CPU.
model = AutoModelForCausalLM.from_pretrained(model_name).to("cpu")

# FastAPI application object on which the HTTP routes are registered.
app = FastAPI()
@app.post("/generate")
def generate_text(prompt: str):
    """Generate text for ``prompt`` using the module-level model and tokenizer.

    Args:
        prompt: Input text that is tokenized and passed to ``model.generate``.

    Returns:
        A dict with the single key ``"generated_query"`` whose value is the
        decoded first generated sequence, with special tokens skipped.
    """
    # Tokenize the prompt into PyTorch tensors ("pt").
    encoded = tokenizer(prompt, return_tensors="pt")

    # NOTE(review): max_length presumably counts the prompt tokens as well as
    # the newly generated ones, so long prompts may leave little or no room
    # for generation -- confirm against the transformers generation docs.
    sequences = model.generate(**encoded, max_length=128)

    # Only the first returned sequence is decoded and sent back.
    first_sequence = sequences[0]
    return {
        "generated_query": tokenizer.decode(
            first_sequence, skip_special_tokens=True
        )
    }
|