Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -64,7 +64,7 @@ def parse_links_and_content(ort):
|
|
64 |
if target_div:
|
65 |
links = [urljoin(base_url, a['href']) for a in target_div.find_all('a', href=True)]
|
66 |
texts = [a.text for a in target_div.find_all('a', href=True)]
|
67 |
-
all_links.extend(
|
68 |
all_links_text.extend(texts)
|
69 |
else:
|
70 |
print(f"Target div not found on page {page_number}")
|
@@ -86,7 +86,7 @@ def scrape_links(links):
|
|
86 |
soup = BeautifulSoup(response.content, 'html.parser')
|
87 |
target_nav = soup.select_one('.nav')
|
88 |
if target_nav:
|
89 |
-
details.append(target_nav.text.strip())
|
90 |
else:
|
91 |
details.append("No contact information found")
|
92 |
except Exception as e:
|
|
|
64 |
if target_div:
|
65 |
links = [urljoin(base_url, a['href']) for a in target_div.find_all('a', href=True)]
|
66 |
texts = [a.text for a in target_div.find_all('a', href=True)]
|
67 |
+
all_links.extend(links)
|
68 |
all_links_text.extend(texts)
|
69 |
else:
|
70 |
print(f"Target div not found on page {page_number}")
|
|
|
86 |
soup = BeautifulSoup(response.content, 'html.parser')
|
87 |
target_nav = soup.select_one('.nav')
|
88 |
if target_nav:
|
89 |
+
details.append(f"{link}: {target_nav.text.strip()}")
|
90 |
else:
|
91 |
details.append("No contact information found")
|
92 |
except Exception as e:
|