Spaces:
Sleeping
Sleeping
Commit
·
e7b63de
1
Parent(s):
3545aac
Update app.py
Browse files
app.py
CHANGED
@@ -572,19 +572,19 @@ async def resources_endpoint(profile: MedicalProfile):
|
|
572 |
folder_path = 'downloaded_articles/downloaded_articles'
|
573 |
initial_results = query_embeddings(query_embedding, embeddings_data, n_results=6)
|
574 |
file_path = 'finalcleaned_excel_file.xlsx'
|
575 |
-
|
576 |
-
|
577 |
-
|
578 |
|
579 |
# Retrieve original URLs
|
580 |
-
|
581 |
-
|
582 |
-
|
583 |
-
|
584 |
-
|
585 |
-
|
586 |
-
|
587 |
-
|
588 |
else:
|
589 |
print(f"Name: {file_name}")
|
590 |
document_ids = [doc_id for doc_id, _ in initial_results]
|
|
|
572 |
folder_path = 'downloaded_articles/downloaded_articles'
|
573 |
initial_results = query_embeddings(query_embedding, embeddings_data, n_results=6)
|
574 |
file_path = 'finalcleaned_excel_file.xlsx'
|
575 |
+
df = pd.read_excel(file_path)
|
576 |
+
file_name_to_url = {f"article_{index}.html": url for index, url in enumerate(df['Unnamed: 0'])}
|
577 |
+
file_names = document_ids
|
578 |
|
579 |
# Retrieve original URLs
|
580 |
+
for file_name in file_names:
|
581 |
+
original_url = file_name_to_url.get(file_name, None)
|
582 |
+
if original_url:
|
583 |
+
title = get_page_title(original_url)
|
584 |
+
if title:
|
585 |
+
print(f"Title: {title},URL: {original_url}")
|
586 |
+
else:
|
587 |
+
print(f"Name: {file_name}")
|
588 |
else:
|
589 |
print(f"Name: {file_name}")
|
590 |
document_ids = [doc_id for doc_id, _ in initial_results]
|