File size: 305 Bytes
428a5aa
 
 
92bb964
 
 
 
428a5aa
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
import requests
from bs4 import BeautifulSoup


def extract_text(url: str, *, timeout: float = 10.0) -> str:
    """Download a web page and return the text of its ``<p>`` elements.

    Args:
        url: Address of the page to fetch. ``None`` or a blank /
            whitespace-only string short-circuits to an empty result
            without touching the network.
        timeout: Seconds to wait on the server before ``requests`` gives
            up; forwarded unchanged to ``requests.get``.

    Returns:
        The text of each ``<p>`` element found by the parser, joined with
        a blank line between paragraphs, or ``''`` when ``url`` is missing
        or blank.

    Raises:
        requests.exceptions.RequestException: If the request cannot be
            completed (connection failure, timeout, invalid URL, ...).
    """
    if url is None or not url.strip():
        return ''
    # requests applies no timeout by default, so without this argument a
    # server that never answers would block the caller forever.
    response = requests.get(url, timeout=timeout)
    # NOTE: the HTTP status is intentionally not checked here; whatever
    # body comes back (including an error page) is parsed as HTML.
    soup = BeautifulSoup(response.text, "html.parser")
    return '\n\n'.join(p.text for p in soup.find_all('p'))