Spaces:
Runtime error
Runtime error
File size: 467 Bytes
836bc0e |
1 2 3 4 5 6 7 8 9 10 11 12 |
from bs4 import BeautifulSoup
def extract_text_from_html(content):
try:
soup = BeautifulSoup(content, "html.parser")
text = soup.get_text(separator="\n")
lines = [t.strip() for t in text.splitlines() if t.strip()]
return lines if lines else ["No data found in this document (empty HTML)"]
except Exception as e:
print(f"❌ HTML parse failed: {str(e)}")
return [f"No data found in this document (HTML error)"]
|