dailypapershackernews-dev

Sleeping

App Files Files Community

akhaliq HF staff committed on Sep 20

Commit

628eca7

•

1 Parent(s): 8cf4d5d

Update app.py

Browse files

Files changed (1) hide show

app.py +34 -7

app.py CHANGED Viewed

@@ -40,23 +40,40 @@ class PaperManager:
         Fetch the repositories (models, datasets, Spaces) associated with a given arxiv_id.
         Returns a dictionary with counts for each type.
         """
         try:
             response = requests.get(REPOS_API_URL_TEMPLATE.format(arxiv_id=arxiv_id))
             response.raise_for_status()
             data = response.json()
             counts = {'models': 0, 'datasets': 0, 'spaces': 0}
             for repo in data:
-                repo_type = repo.get('type', '').lower()
-                if repo_type == 'model':
                     counts['models'] += 1
-                elif repo_type == 'dataset':
                     counts['datasets'] += 1
-                elif repo_type == 'space':
                     counts['spaces'] += 1
             return counts
         except requests.RequestException as e:
-            print(f"Error fetching repos for arxiv_id {arxiv_id}: {e}")
             return {'models': 0, 'datasets': 0, 'spaces': 0}
         except Exception as e:
             print(f"Unexpected error fetching repos for arxiv_id {arxiv_id}: {e}")
@@ -74,9 +91,17 @@ class PaperManager:
             self.raw_papers = data  # Store raw data
             # Fetch repos counts concurrently
             with ThreadPoolExecutor(max_workers=20) as executor:
-                future_to_paper = {executor.submit(self.fetch_repos_counts, paper.get('paper', {}).get('arxiv_id', '')): paper for paper in self.raw_papers}
                 for future in as_completed(future_to_paper):
                     paper = future_to_paper[future]
                     counts = future.result()
@@ -201,11 +226,13 @@ class PaperManager:
     def next_page(self):
         """Move one page forward when not already on the last page.

         The page counter is only incremented while it is still below
         ``self.total_pages``; in every case the result of
         ``self.render_papers()`` is returned.
         """
         can_advance = self.current_page < self.total_pages
         if can_advance:
             self.current_page += 1
         rendered = self.render_papers()
         return rendered
     def prev_page(self):
         """Move one page back when not already on the first page.

         The page counter is only decremented while it is greater than 1;
         in every case the result of ``self.render_papers()`` is returned.
         """
         can_go_back = self.current_page > 1
         if can_go_back:
             self.current_page -= 1
         rendered = self.render_papers()
         return rendered
 paper_manager = PaperManager()
@@ -416,4 +443,4 @@ with demo:
         outputs=[paper_list]
     )
-demo.launch()

         Fetch the repositories (models, datasets, Spaces) associated with a given arxiv_id.
         Returns a dictionary with counts for each type.
         """
+        if not arxiv_id:
+            print("Empty arxiv_id provided.")
+            return {'models': 0, 'datasets': 0, 'spaces': 0}
         try:
+            print(f"Fetching repositories for arxiv_id: {arxiv_id}")
             response = requests.get(REPOS_API_URL_TEMPLATE.format(arxiv_id=arxiv_id))
             response.raise_for_status()
             data = response.json()
+            # Debugging: Print the fetched data
+            print(f"Repositories data for {arxiv_id}: {data}")
             counts = {'models': 0, 'datasets': 0, 'spaces': 0}
             for repo in data:
+                repo_type = repo.get('type', '').strip().lower()
+                print(f"Repo type found: {repo_type}")  # Debugging
+                if repo_type == 'models':
                     counts['models'] += 1
+                elif repo_type == 'datasets':
                     counts['datasets'] += 1
+                elif repo_type == 'spaces':
                     counts['spaces'] += 1
+                else:
+                    print(f"Unknown repo type: {repo_type}")  # Debugging unknown types
+            print(f"Counts for {arxiv_id}: {counts}")  # Debugging
             return counts
         except requests.RequestException as e:
+            print(f"HTTP error fetching repos for arxiv_id {arxiv_id}: {e}")
+            return {'models': 0, 'datasets': 0, 'spaces': 0}
+        except ValueError as e:
+            print(f"JSON decoding error for arxiv_id {arxiv_id}: {e}")
             return {'models': 0, 'datasets': 0, 'spaces': 0}
         except Exception as e:
             print(f"Unexpected error fetching repos for arxiv_id {arxiv_id}: {e}")
             self.raw_papers = data  # Store raw data
+            # Debugging: Print some arxiv_ids
+            for paper in self.raw_papers[:5]:
+                arxiv_id = paper.get('paper', {}).get('arxiv_id', '')
+                print(f"Sample arxiv_id: {arxiv_id}")
             # Fetch repos counts concurrently
             with ThreadPoolExecutor(max_workers=20) as executor:
+                future_to_paper = {
+                    executor.submit(self.fetch_repos_counts, paper.get('paper', {}).get('arxiv_id', '')): paper
+                    for paper in self.raw_papers
+                }
                 for future in as_completed(future_to_paper):
                     paper = future_to_paper[future]
                     counts = future.result()
     def next_page(self):
         # Advance the page counter only while it is below total_pages,
         # so the counter never moves past the last page.
         if self.current_page < self.total_pages:
             self.current_page += 1
         # The "+"-marked line below is the debug print added by this commit;
         # it runs whether or not the counter actually changed.
+        print(f"Navigated to page {self.current_page}")  # Debug
         # Always return the re-rendered paper list for the current page.
         return self.render_papers()
     def prev_page(self):
         # Step the page counter back only while it is above 1,
         # so the counter never drops below the first page.
         if self.current_page > 1:
             self.current_page -= 1
         # The "+"-marked line below is the debug print added by this commit;
         # it runs whether or not the counter actually changed.
+        print(f"Navigated to page {self.current_page}")  # Debug
         # Always return the re-rendered paper list for the current page.
         return self.render_papers()
 paper_manager = PaperManager()
         outputs=[paper_list]
     )
+demo.launch()