Spaces:

benkada
/

aiWeb

Running

App Files Files Community

benkada committed on 4 days ago

Commit

cf9785c

verified ·

1 Parent(s): 2dd1f0a

Update main.py

Browse files

Files changed (1) hide show

main.py +5 -9

main.py CHANGED Viewed

@@ -20,7 +20,7 @@ PORT              = int(os.getenv("PORT", 7860))
 app = FastAPI(
     title       = "AI-Powered Web-App API",
     description = "Backend for summarisation, captioning & QA",
-    version     = "1.2.3",               # <-- bumped
 )
 app.add_middleware(
@@ -47,15 +47,12 @@ summary_client        = InferenceClient(
     timeout = 120,
 )
-# ➜ Upgraded QA model (higher accuracy than roberta-base)
 qa_client             = InferenceClient(
-    "deepset/roberta-large-squad2",
     token   = HUGGINGFACE_TOKEN,
-    timeout = 120,
 )
-# If you need multilingual support, swap for:
-# qa_client = InferenceClient("deepset/xlm-roberta-large-squad2",
-#                             token=HUGGINGFACE_TOKEN, timeout=120)
 image_caption_client  = InferenceClient(
     "nlpconnect/vit-gpt2-image-captioning",
@@ -114,7 +111,6 @@ async def summarize_document(file: UploadFile = File(...)):
 # -------------------- Image Caption ------------------------------------------
 @app.post("/api/caption")
 async def caption_image(image: UploadFile = File(...)):
-    """`image` field name matches frontend (was `file` before)."""
     try:
         img_bytes = await image.read()
         img       = Image.open(io.BytesIO(img_bytes)).convert("RGB")
@@ -149,7 +145,7 @@ async def question_answering(file: UploadFile = File(...),
             context  = (res.get("generated_text") if isinstance(res, dict)
                         else str(res))
         else:
-            context = process_uploaded_file(file)[:3000]
         if not context:
             return {"result": "No context – cannot answer."}

 app = FastAPI(
     title       = "AI-Powered Web-App API",
     description = "Backend for summarisation, captioning & QA",
+    version     = "1.2.4",               # <-- bumped
 )
 app.add_middleware(
     timeout = 120,
 )
+# ➜ Upgraded QA model to a BigBird-RoBERTa checkpoint (better for documents)
 qa_client             = InferenceClient(
+    "google/bigbird-roberta-base-squad2",
     token   = HUGGINGFACE_TOKEN,
+    timeout = 180,
 )
 image_caption_client  = InferenceClient(
     "nlpconnect/vit-gpt2-image-captioning",
 # -------------------- Image Caption ------------------------------------------
 @app.post("/api/caption")
 async def caption_image(image: UploadFile = File(...)):
     try:
         img_bytes = await image.read()
         img       = Image.open(io.BytesIO(img_bytes)).convert("RGB")
             context  = (res.get("generated_text") if isinstance(res, dict)
                         else str(res))
         else:
+            context = process_uploaded_file(file)[:4096]   # BigBird handles longer contexts
         if not context:
             return {"result": "No context – cannot answer."}