FreeBibTec2

Sleeping

App Files Files Community

C2MV committed on Dec 14, 2024

Commit

0e74018

verified ·

1 Parent(s): 707bdc5

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -12

app.py CHANGED Viewed

@@ -283,7 +283,6 @@ class PaperDownloader:
             logger.error(f"Error processing {doi}: {e}")
             return None, f"Error processing {doi}: {e}", f"Error processing {doi}: {e}"
     async def download_multiple_dois_async(self, dois_text):
         """Downloads multiple papers from a list of DOIs"""
         if not dois_text:
@@ -299,13 +298,12 @@ class PaperDownloader:
         for i, doi in enumerate(tqdm(dois, desc="Downloading papers")):
             filepath, success_message, fail_message = await self.download_single_doi_async(doi)
             if filepath:
-                 # Unique filename for zip
                 filename = f"{str(doi).replace('/', '_').replace('.', '_')}_{i}.pdf"
                 filepath_unique = os.path.join(self.output_dir, filename)
                 os.rename(filepath, filepath_unique)
                 downloaded_files.append(filepath_unique)
                 downloaded_links.append(f'<a href="https://doi.org/{doi}">{doi}</a>')
             else:
                 failed_dois.append(f'<a href="https://doi.org/{doi}">{doi}</a>')
@@ -318,7 +316,6 @@ class PaperDownloader:
         return zip_filename if downloaded_files else None, "\n".join(downloaded_links), "\n".join(failed_dois)
     async def process_bibtex_async(self, bib_file):
         """Process BibTeX file and download papers with multiple strategies"""
         # Read BibTeX file content from the uploaded object
@@ -327,14 +324,14 @@ class PaperDownloader:
                 bib_content = f.read()
         except Exception as e:
             logger.error(f"Error reading uploaded file {bib_file.name}: {e}")
-            return None, f"Error reading uploaded file {bib_file.name}: {e}", f"Error reading uploaded file {bib_file.name}: {e}", None
         # Parse BibTeX data
         try:
             bib_database = bibtexparser.loads(bib_content)
         except Exception as e:
             logger.error(f"Error parsing BibTeX data: {e}")
-            return None, f"Error parsing BibTeX data: {e}", f"Error parsing BibTeX data: {e}", None
         # Extract DOIs
         dois = [entry.get('doi') for entry in bib_database.entries if entry.get('doi')]
@@ -346,7 +343,7 @@ class PaperDownloader:
         downloaded_links = []
         # Download PDFs
-        for i,doi in enumerate(tqdm(dois, desc="Downloading papers")):
             try:
                 # Try to download with multiple methods with retries
                 pdf_content = await self.download_with_retry_async(doi)
@@ -354,7 +351,7 @@ class PaperDownloader:
                 # Save PDF
                 if pdf_content:
                     if doi is None:
-                        return None, "Error: DOI not provided", "Error: DOI not provided", None
                     filename = f"{str(doi).replace('/', '_').replace('.', '_')}_{i}.pdf"
                     filepath = os.path.join(self.output_dir, filename)
@@ -379,8 +376,7 @@ class PaperDownloader:
                     zipf.write(file_path, arcname=os.path.basename(file_path))
             logger.info(f"ZIP file created: {zip_filename}")
-        return zip_filename, "\n".join(downloaded_links), "\n".join(failed_dois), None
 def create_gradio_interface():
     """Create Gradio interface for Paper Downloader"""
@@ -392,7 +388,7 @@ def create_gradio_interface():
             if not bib_file.name.lower().endswith('.bib'):
                 return None, "Error: Please upload a .bib file", "Error: Please upload a .bib file", None
-            zip_path, downloaded_dois, failed_dois,  = await downloader.process_bibtex_async(bib_file)
             return zip_path, downloaded_dois, failed_dois, None
         elif doi_input:
             filepath, message, failed_doi = await downloader.download_single_doi_async(doi_input)
@@ -403,6 +399,7 @@ def create_gradio_interface():
         else:
             return None, "Please provide a .bib file, a single DOI, or a list of DOIs", "Please provide a .bib file, a single DOI, or a list of DOIs", None
     # Gradio Interface
     interface = gr.Interface(
         fn=download_papers,
@@ -429,7 +426,7 @@ def create_gradio_interface():
                     <div id="failed-dois"></div>
                 </div>
             """),
-            gr.File(label="Downloaded Single PDF")
         ],
         title="🔬 Academic Paper Batch Downloader",
         description="Upload a BibTeX file or enter DOIs to download PDFs. We'll attempt to fetch PDFs from multiple sources like Sci-Hub, Libgen, Google Scholar and Crossref. You can use any of the three inputs at any moment.",

             logger.error(f"Error processing {doi}: {e}")
             return None, f"Error processing {doi}: {e}", f"Error processing {doi}: {e}"
     async def download_multiple_dois_async(self, dois_text):
         """Downloads multiple papers from a list of DOIs"""
         if not dois_text:
         for i, doi in enumerate(tqdm(dois, desc="Downloading papers")):
             filepath, success_message, fail_message = await self.download_single_doi_async(doi)
             if filepath:
+                # Unique filename for zip
                 filename = f"{str(doi).replace('/', '_').replace('.', '_')}_{i}.pdf"
                 filepath_unique = os.path.join(self.output_dir, filename)
                 os.rename(filepath, filepath_unique)
                 downloaded_files.append(filepath_unique)
                 downloaded_links.append(f'<a href="https://doi.org/{doi}">{doi}</a>')
             else:
                 failed_dois.append(f'<a href="https://doi.org/{doi}">{doi}</a>')
         return zip_filename if downloaded_files else None, "\n".join(downloaded_links), "\n".join(failed_dois)
     async def process_bibtex_async(self, bib_file):
         """Process BibTeX file and download papers with multiple strategies"""
         # Read BibTeX file content from the uploaded object
                 bib_content = f.read()
         except Exception as e:
             logger.error(f"Error reading uploaded file {bib_file.name}: {e}")
+            return None, f"Error reading uploaded file {bib_file.name}: {e}", f"Error reading uploaded file {bib_file.name}: {e}"
         # Parse BibTeX data
         try:
             bib_database = bibtexparser.loads(bib_content)
         except Exception as e:
             logger.error(f"Error parsing BibTeX data: {e}")
+            return None, f"Error parsing BibTeX data: {e}", f"Error parsing BibTeX data: {e}"
         # Extract DOIs
         dois = [entry.get('doi') for entry in bib_database.entries if entry.get('doi')]
         downloaded_links = []
         # Download PDFs
+        for i, doi in enumerate(tqdm(dois, desc="Downloading papers")):
             try:
                 # Try to download with multiple methods with retries
                 pdf_content = await self.download_with_retry_async(doi)
                 # Save PDF
                 if pdf_content:
                     if doi is None:
+                        return None, "Error: DOI not provided", "Error: DOI not provided"
                     filename = f"{str(doi).replace('/', '_').replace('.', '_')}_{i}.pdf"
                     filepath = os.path.join(self.output_dir, filename)
                     zipf.write(file_path, arcname=os.path.basename(file_path))
             logger.info(f"ZIP file created: {zip_filename}")
+        return zip_filename, "\n".join(downloaded_links), "\n".join(failed_dois)
 def create_gradio_interface():
     """Create Gradio interface for Paper Downloader"""
             if not bib_file.name.lower().endswith('.bib'):
                 return None, "Error: Please upload a .bib file", "Error: Please upload a .bib file", None
+            zip_path, downloaded_dois, failed_dois = await downloader.process_bibtex_async(bib_file)
             return zip_path, downloaded_dois, failed_dois, None
         elif doi_input:
             filepath, message, failed_doi = await downloader.download_single_doi_async(doi_input)
         else:
             return None, "Please provide a .bib file, a single DOI, or a list of DOIs", "Please provide a .bib file, a single DOI, or a list of DOIs", None
     # Gradio Interface
     interface = gr.Interface(
         fn=download_papers,
                     <div id="failed-dois"></div>
                 </div>
             """),
+           gr.File(label="Downloaded Single PDF")
         ],
         title="🔬 Academic Paper Batch Downloader",
         description="Upload a BibTeX file or enter DOIs to download PDFs. We'll attempt to fetch PDFs from multiple sources like Sci-Hub, Libgen, Google Scholar and Crossref. You can use any of the three inputs at any moment.",