Update to use correct HF dataset: modelbiome/ai_ecosystem
Browse files
- Changed from ai_ecosystem_withmodelcards to ai_ecosystem
- This enables access to the full 1.86M+ model dataset
backend.log
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
INFO: Will watch for changes in these directories: ['/Users/hamidaho/hf_viz/backend']
|
| 2 |
+
INFO: Uvicorn running on http://0.0.0.0:8000 (Press CTRL+C to quit)
|
| 3 |
+
INFO: Started reloader process [24332] using WatchFiles
|
| 4 |
+
INFO: Started server process [24386]
|
| 5 |
+
INFO: Waiting for application startup.
|
| 6 |
+
Repo card metadata block was not found. Setting CardData to empty.
|
backend/services/model_tracker_improved.py
CHANGED
|
@@ -259,7 +259,7 @@ class ImprovedModelCountTracker:
|
|
| 259 |
logger.error(f"Error extracting count from HF models page: {e}", exc_info=True)
|
| 260 |
return None
|
| 261 |
|
| 262 |
-
def get_count_from_dataset_snapshot(self, dataset_name: str = "modelbiome/ai_ecosystem_withmodelcards") -> Optional[Dict]:
|
| 263 |
"""
|
| 264 |
Alternative method: Get count from dataset snapshot (like ai-ecosystem repo does).
|
| 265 |
This is faster but may be slightly outdated.
|
|
|
|
| 259 |
logger.error(f"Error extracting count from HF models page: {e}", exc_info=True)
|
| 260 |
return None
|
| 261 |
|
| 262 |
+
def get_count_from_dataset_snapshot(self, dataset_name: str = "modelbiome/ai_ecosystem") -> Optional[Dict]:
|
| 263 |
"""
|
| 264 |
Alternative method: Get count from dataset snapshot (like ai-ecosystem repo does).
|
| 265 |
This is faster but may be slightly outdated.
|
backend/utils/data_loader.py
CHANGED
|
@@ -10,7 +10,7 @@ import numpy as np
|
|
| 10 |
class ModelDataLoader:
|
| 11 |
"""Load and preprocess model data from Hugging Face dataset."""
|
| 12 |
|
| 13 |
-
def __init__(self, dataset_name: str = "modelbiome/ai_ecosystem_withmodelcards"):
|
| 14 |
self.dataset_name = dataset_name
|
| 15 |
self.df: Optional[pd.DataFrame] = None
|
| 16 |
|
|
|
|
| 10 |
class ModelDataLoader:
|
| 11 |
"""Load and preprocess model data from Hugging Face dataset."""
|
| 12 |
|
| 13 |
+
def __init__(self, dataset_name: str = "modelbiome/ai_ecosystem"):
|
| 14 |
self.dataset_name = dataset_name
|
| 15 |
self.df: Optional[pd.DataFrame] = None
|
| 16 |
|