CrispChat

Sleeping

App Files Files Community

cstr committed about 1 month ago

Commit

3dc43a9

verified ·

1 Parent(s): 6ee626f

Update app.py

Browse files

Files changed (1) hide show

app.py +40 -21

app.py CHANGED Viewed

@@ -226,11 +226,18 @@ def encode_image_to_base64(image_path):
                 elif file_extension == "webp":
                     mime_type = "image/webp"
                 return f"data:{mime_type};base64,{encoded_string}"
-        elif Image is not None and hasattr(image_path, 'save'):  # Pillow Image
-            buffered = io.BytesIO()
-            image_path.save(buffered, format="PNG")
-            encoded_string = base64.b64encode(buffered.getvalue()).decode('utf-8')
-            return f"data:image/png;base64,{encoded_string}"
         else:  # Handle file object or other types
             logger.error(f"Unsupported image type: {type(image_path)}")
             return None
@@ -283,7 +290,9 @@ def prepare_message_with_media(text, images=None, documents=None):
         for doc in documents:
             if doc is None:
                 continue
-            doc_text = extract_text_from_file(doc)
             if doc_text:
                 document_texts.append(doc_text)
@@ -304,15 +313,27 @@ def prepare_message_with_media(text, images=None, documents=None):
     content = [{"type": "text", "text": text}]
     # Add images if any
-    if images and any(img is not None for img in images):
-        for img in images:
-            if img is None:
-                continue
-            encoded_image = encode_image_to_base64(img)
             if encoded_image:
                 content.append({
-                    "type": "image_url",
                     "image_url": {"url": encoded_image}
                 })
@@ -331,7 +352,7 @@ def format_to_message_dict(history):
     return messages
 def process_uploaded_images(files):
-    """Process uploaded image files - fixed for Gradio 4.44.1"""
     file_paths = []
     for file in files:
         if hasattr(file, 'name'):
@@ -640,12 +661,10 @@ def create_app():
                 with gr.Row():
                     # Image upload
                     with gr.Accordion("Upload Images (for vision models)", open=False):
-                        images = gr.Gallery(
-                            label="Uploaded Images",
-                            show_label=True,
-                            columns=4,
-                            height="auto",
-                            object_fit="contain"
                         )
                         image_upload_btn = gr.UploadButton(
@@ -907,7 +926,7 @@ def create_app():
         # Process uploaded images
         image_upload_btn.upload(
-            fn=process_uploaded_images,
             inputs=image_upload_btn,
             outputs=images
         )

                 elif file_extension == "webp":
                     mime_type = "image/webp"
                 return f"data:{mime_type};base64,{encoded_string}"
+        elif hasattr(image_path, 'name'):  # Handle Gradio file objects directly
+            with open(image_path.name, "rb") as image_file:
+                encoded_string = base64.b64encode(image_file.read()).decode('utf-8')
+                file_extension = image_path.name.split('.')[-1].lower()
+                mime_type = f"image/{file_extension}"
+                if file_extension in ["jpg", "jpeg"]:
+                    mime_type = "image/jpeg"
+                elif file_extension == "png":
+                    mime_type = "image/png"
+                elif file_extension == "webp":
+                    mime_type = "image/webp"
+                return f"data:{mime_type};base64,{encoded_string}"
         else:  # Handle file object or other types
             logger.error(f"Unsupported image type: {type(image_path)}")
             return None
         for doc in documents:
             if doc is None:
                 continue
+            # Make sure to handle file objects properly
+            doc_path = doc.name if hasattr(doc, 'name') else doc
+            doc_text = extract_text_from_file(doc_path)
             if doc_text:
                 document_texts.append(doc_text)
     content = [{"type": "text", "text": text}]
     # Add images if any
+    if images:
+        # Check if images is a list of image paths or file objects
+        if isinstance(images, list):
+            for img in images:
+                if img is None:
+                    continue
+                encoded_image = encode_image_to_base64(img)
+                if encoded_image:
+                    content.append({
+                        "type": "image_url",
+                        "image_url": {"url": encoded_image}
+                    })
+        else:
+            # For single image or Gallery component
+            logger.warning(f"Images is not a list: {type(images)}")
+            # Try to handle as single image
+            encoded_image = encode_image_to_base64(images)
             if encoded_image:
                 content.append({
+                    "type": "image_url",
                     "image_url": {"url": encoded_image}
                 })
     return messages
 def process_uploaded_images(files):
+    """Process uploaded image files"""
     file_paths = []
     for file in files:
         if hasattr(file, 'name'):
                 with gr.Row():
                     # Image upload
                     with gr.Accordion("Upload Images (for vision models)", open=False):
+                        images = gr.File(
+                            label="Uploaded Images",
+                            file_types=["image"],
+                            file_count="multiple"
                         )
                         image_upload_btn = gr.UploadButton(
         # Process uploaded images
         image_upload_btn.upload(
+            fn=lambda files: files,
             inputs=image_upload_btn,
             outputs=images
         )