dailypapershackernews-dev

Running

App Files Community

akhaliq HF staff committed on Sep 20, 2024

Commit

8cf4d5d

verified ·

1 Parent(s): cc4c9e4

Update app.py

Browse files

Files changed (1) hide show

app.py +3 -25

app.py CHANGED Viewed

@@ -41,11 +41,9 @@ class PaperManager:
         Returns a dictionary with counts for each type.
         """
         try:
-            print(f"Fetching repos for arxiv_id: {arxiv_id}")  # Debug
             response = requests.get(REPOS_API_URL_TEMPLATE.format(arxiv_id=arxiv_id))
             response.raise_for_status()
             data = response.json()
-            print(f"Repos data for arxiv_id {arxiv_id}: {data}")  # Debug
             counts = {'models': 0, 'datasets': 0, 'spaces': 0}
             for repo in data:
@@ -56,7 +54,6 @@ class PaperManager:
                     counts['datasets'] += 1
                 elif repo_type == 'space':
                     counts['spaces'] += 1
-            print(f"Counts for arxiv_id {arxiv_id}: {counts}")  # Debug
             return counts
         except requests.RequestException as e:
             print(f"Error fetching repos for arxiv_id {arxiv_id}: {e}")
@@ -75,30 +72,14 @@ class PaperManager:
                 print("No data received from API.")
                 return False
-            # Debug: Print keys of the first paper
-            print("Keys in the first paper:", data[0].keys())
             self.raw_papers = data  # Store raw data
             # Fetch repos counts concurrently
             with ThreadPoolExecutor(max_workers=20) as executor:
-                future_to_paper = {}
-                for paper in self.raw_papers:
-                    arxiv_id = paper.get('paper', {}).get('arxiv_id', '')
-                    print(f"Processing paper ID: {paper.get('paper', {}).get('id', '')}, arxiv_id: {arxiv_id}")  # Debug
-                    if arxiv_id:
-                        future = executor.submit(self.fetch_repos_counts, arxiv_id)
-                        future_to_paper[future] = paper
-                    else:
-                        # If no arxiv_id, set counts to zero
-                        paper['models'] = 0
-                        paper['datasets'] = 0
-                        paper['spaces'] = 0
                 for future in as_completed(future_to_paper):
                     paper = future_to_paper[future]
                     counts = future.result()
-                    print(f"Paper ID: {paper.get('paper', {}).get('id', '')}, Counts: {counts}")  # Debug
                     paper['models'] = counts['models']
                     paper['datasets'] = counts['datasets']
                     paper['spaces'] = counts['spaces']
@@ -124,7 +105,7 @@ class PaperManager:
         elif self.sort_method == "new":
             self.papers = sorted(
                 self.raw_papers,
-                key=lambda x: x.get('published_at', ''),
                 reverse=True
             )
         elif self.sort_method == "most_models":
@@ -171,7 +152,7 @@ class PaperManager:
         authors = ', '.join([author.get('name', '') for author in paper.get('paper', {}).get('authors', [])]) or 'Unknown'
         upvotes = paper.get('paper', {}).get('upvotes', 0)
         comments = paper.get('numComments', 0)
-        published_time_str = paper.get('published_at', datetime.now(timezone.utc).isoformat())
         try:
             published_time = datetime.fromisoformat(published_time_str.replace('Z', '+00:00'))
         except ValueError:
@@ -184,8 +165,6 @@ class PaperManager:
         datasets = paper.get('datasets', 0)
         spaces = paper.get('spaces', 0)
-        print(f"Formatting paper {rank}: Models={models}, Datasets={datasets}, Spaces={spaces}")  # Debug
         return f"""
         <tr class="athing">
             <td align="right" valign="top" class="title"><span class="rank">{rank}.</span></td>
@@ -254,7 +233,6 @@ def change_sort_method(method):
         return "<div class='no-papers'>Failed to sort papers. Please try again later.</div>"
 css = """
-/* Existing CSS remains unchanged */
 body {
     background-color: white;
     font-family: Verdana, Geneva, sans-serif;

         Returns a dictionary with counts for each type.
         """
         try:
             response = requests.get(REPOS_API_URL_TEMPLATE.format(arxiv_id=arxiv_id))
             response.raise_for_status()
             data = response.json()
             counts = {'models': 0, 'datasets': 0, 'spaces': 0}
             for repo in data:
                     counts['datasets'] += 1
                 elif repo_type == 'space':
                     counts['spaces'] += 1
             return counts
         except requests.RequestException as e:
             print(f"Error fetching repos for arxiv_id {arxiv_id}: {e}")
                 print("No data received from API.")
                 return False
             self.raw_papers = data  # Store raw data
             # Fetch repos counts concurrently
             with ThreadPoolExecutor(max_workers=20) as executor:
+                future_to_paper = {executor.submit(self.fetch_repos_counts, paper.get('paper', {}).get('arxiv_id', '')): paper for paper in self.raw_papers}
                 for future in as_completed(future_to_paper):
                     paper = future_to_paper[future]
                     counts = future.result()
                     paper['models'] = counts['models']
                     paper['datasets'] = counts['datasets']
                     paper['spaces'] = counts['spaces']
         elif self.sort_method == "new":
             self.papers = sorted(
                 self.raw_papers,
+                key=lambda x: x.get('publishedAt', ''),
                 reverse=True
             )
         elif self.sort_method == "most_models":
         authors = ', '.join([author.get('name', '') for author in paper.get('paper', {}).get('authors', [])]) or 'Unknown'
         upvotes = paper.get('paper', {}).get('upvotes', 0)
         comments = paper.get('numComments', 0)
+        published_time_str = paper.get('publishedAt', datetime.now(timezone.utc).isoformat())
         try:
             published_time = datetime.fromisoformat(published_time_str.replace('Z', '+00:00'))
         except ValueError:
         datasets = paper.get('datasets', 0)
         spaces = paper.get('spaces', 0)
         return f"""
         <tr class="athing">
             <td align="right" valign="top" class="title"><span class="rank">{rank}.</span></td>
         return "<div class='no-papers'>Failed to sort papers. Please try again later.</div>"
 css = """
 body {
     background-color: white;
     font-family: Verdana, Geneva, sans-serif;