Spaces:
Runtime error
Runtime error
File size: 524 Bytes
605d9a8 055aed6 605d9a8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 |
from fastapi import FastAPI
from transformers import AutoModelForCausalLM, AutoTokenizer
# ASGI application object; the route decorator below registers handlers on it.
app = FastAPI()
# Load the tokenizer and model once at import time so every request to the
# handler reuses the same objects instead of reloading them per call.
# NOTE(review): the "7b" in the name suggests a multi-billion-parameter
# checkpoint; loading it at import presumably needs substantial memory and
# startup time — confirm the host can hold it.
model_name = "PygmalionAI/pygmalion-7b"
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForCausalLM.from_pretrained(model_name)
@app.get("/chat")
def chat(msg: str):
    """Generate a reply to ``msg`` using the module-level model.

    Args:
        msg: Prompt text. As a plain ``str`` parameter of a GET route it is
            supplied by the caller as the ``msg`` query parameter.

    Returns:
        A dict with a single ``"response"`` key holding the decoded text of
        the first generated sequence, with special tokens stripped.
        NOTE(review): for a causal LM the generated sequence presumably
        begins with the prompt tokens, so the response would echo ``msg``
        before the continuation — confirm against client expectations.
    """
    inputs = tokenizer(msg, return_tensors="pt")
    # Bound the number of *generated* tokens instead of the total length:
    # ``max_length`` also counts the prompt, so a prompt of 200+ tokens left
    # no room to generate anything (and recent transformers versions reject
    # that combination with a ValueError).
    response = model.generate(**inputs, max_new_tokens=200)
    return {"response": tokenizer.decode(response[0], skip_special_tokens=True)}