Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -41,9 +41,10 @@ def parse_links_and_content(ort):
|
|
41 |
target_div = soup.select_one('div.row-cols-1:nth-child(4)')
|
42 |
|
43 |
if target_div:
|
44 |
-
links = [urljoin(base_url, a['href']) for a in target_div.find_all('a', href=True)]
|
45 |
-
|
46 |
-
|
|
|
47 |
else:
|
48 |
print(f"Target div not found on page {page_number}")
|
49 |
|
|
|
41 |
target_div = soup.select_one('div.row-cols-1:nth-child(4)')
|
42 |
|
43 |
if target_div:
|
44 |
+
#links = [urljoin(base_url, a['href']) for a in target_div.find_all('a', href=True)]
|
45 |
+
texts = [a.text for a in target_div.find_all('a', href=True)]
|
46 |
+
#all_texts.extend(texts)
|
47 |
+
all_links.extend(texts)
|
48 |
else:
|
49 |
print(f"Target div not found on page {page_number}")
|
50 |
|