Spaces:

KSh100
/

websearch

Sleeping

App Files Files Community

KSh100 committed on Mar 26

Commit

bf6070d

verified ·

1 Parent(s): a7a0560

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -7

app.py CHANGED Viewed

@@ -81,7 +81,7 @@ def format_detailed_output(structured_data):
 # --- Web Page Processing Functions ---
-def download_and_process_web_page(url, clean=True):
     """Downloads a web page from a URL and processes its content."""
     if not url.startswith("http://") and not url.startswith("https://"):
         url = "http://" + url  # Prepend "http://" if not present
@@ -89,7 +89,7 @@ def download_and_process_web_page(url, clean=True):
     try:
         response = get(url)
         if response.status_code != 200:
-            return f"Error: Received status code {response.status_code}", 0
         soup = response.soup()
         structured_data = {
@@ -97,12 +97,12 @@ def download_and_process_web_page(url, clean=True):
             "Links": extract_links(soup, url),
             "Images": extract_images(soup, url)
         }
-        return format_detailed_output(structured_data), 0
     except urllib3.exceptions.HTTPError as e:
-        return f"Error: {e}", 0
     except Exception as e:
-        return f"Error processing web page: {e}", 0
 # --- Gradio Interface ---
@@ -110,11 +110,9 @@ iface = gr.Interface(
     fn=download_and_process_web_page,
     inputs=[
         gr.Textbox(lines=1, placeholder="Enter URL of the web page"),
-        gr.Checkbox(label="Clean Text", value=True),
     ],
     outputs=[
         gr.Markdown(label="Web Page Content"),
-        gr.Number(label="Content Length (characters)"),
     ],
     title="Enhanced Web Page Processor for Hugging Face Chat Tools",
     description="Enter the URL of a web page. The tool will extract and format its content, including text, links, and images. This tool is designed for use with Hugging Face Chat Tools. \n [https://hf.co/chat/tools/66f1a8159d41ad4398ebb711](https://hf.co/chat/tools/66f1a8159d41ad4398ebb711)",

 # --- Web Page Processing Functions ---
+def download_and_process_web_page(url):
     """Downloads a web page from a URL and processes its content."""
     if not url.startswith("http://") and not url.startswith("https://"):
         url = "http://" + url  # Prepend "http://" if not present
     try:
         response = get(url)
         if response.status_code != 200:
+            return f"Error: Received status code {response.status_code}"
         soup = response.soup()
         structured_data = {
             "Links": extract_links(soup, url),
             "Images": extract_images(soup, url)
         }
+        return format_detailed_output(structured_data)
     except urllib3.exceptions.HTTPError as e:
+        return f"Error: {e}"
     except Exception as e:
+        return f"Error processing web page: {e}"
 # --- Gradio Interface ---
     fn=download_and_process_web_page,
     inputs=[
         gr.Textbox(lines=1, placeholder="Enter URL of the web page"),
     ],
     outputs=[
         gr.Markdown(label="Web Page Content"),
     ],
     title="Enhanced Web Page Processor for Hugging Face Chat Tools",
     description="Enter the URL of a web page. The tool will extract and format its content, including text, links, and images. This tool is designed for use with Hugging Face Chat Tools. \n [https://hf.co/chat/tools/66f1a8159d41ad4398ebb711](https://hf.co/chat/tools/66f1a8159d41ad4398ebb711)",