Spaces:

KSh100
/

websearch

Build error

KSh100 committed on Apr 13, 2025

Commit

1db6081

verified ·

1 Parent(s): c866c44

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -52,16 +52,13 @@ def extract_images(soup, base_url):
         full_img_url = urljoin(base_url, img_url) if not img_url.startswith(("http://", "https://")) else img_url
         alt_text = img.get('alt', 'No Alt Text')
         images.append({"Alt Text": alt_text, "Image URL": full_img_url})
-    return images
 def format_detailed_output(structured_data, title):
-    """Formats the structured data into a Markdown string with each text, link, and image on a new line."""
     result = f"### Title\n\n{title}\n\n"
     result += "### Texts\n\n"
-    if structured_data["Texts"]:
-        result += "\n".join(structured_data["Texts"])
-    else:
-        result += "No textual content found."
     result += "\n\n### Links\n\n"
     if structured_data["Links"]:
         result += "\n".join(f"[{link['Text']}]({link['URL']})" for link in structured_data["Links"])

         full_img_url = urljoin(base_url, img_url) if not img_url.startswith(("http://", "https://")) else img_url
         alt_text = img.get('alt', 'No Alt Text')
         images.append({"Alt Text": alt_text, "Image URL": full_img_url})
+        return images
 def format_detailed_output(structured_data, title):
+    """Formats the structured data into a Markdown string."""
     result = f"### Title\n\n{title}\n\n"
     result += "### Texts\n\n"
+    result += " ".join(structured_data["Texts"]) if structured_data["Texts"] else "No textual content found."
     result += "\n\n### Links\n\n"
     if structured_data["Links"]:
         result += "\n".join(f"[{link['Text']}]({link['URL']})" for link in structured_data["Links"])