diff --git a/backend/README.md b/backend/README.md
deleted file mode 100644
index 4e6bf71c7455538db98de6e1adc059efef73b083..0000000000000000000000000000000000000000
--- a/backend/README.md
+++ /dev/null
@@ -1,24 +0,0 @@
-# Backend API
-
-FastAPI backend for serving model data to the React frontend.
-
-## Structure
-
-- `api/` - API routes and main application
-- `services/` - External service integrations (arXiv, model tracking, scheduling)
-- `utils/` - Utility modules (data loading, embeddings, dimensionality reduction, clustering, network analysis)
-- `config/` - Configuration files (requirements.txt, etc.)
-- `cache/` - Cached data (embeddings, reduced dimensions)
-
-## Running
-
-```bash
-cd backend
-uvicorn api.main:app --reload --host 0.0.0.0 --port 8000
-```
-
-## Environment Variables
-
-- `SAMPLE_SIZE` - Limit number of models to load (for development). Set to 0 or leave unset to load all models.
-
-
diff --git a/backend/api/dependencies.py b/backend/api/dependencies.py
new file mode 100644
index 0000000000000000000000000000000000000000..9b755ecace186f059d133d1fb23ef8a8625c0bcb
--- /dev/null
+++ b/backend/api/dependencies.py
@@ -0,0 +1,23 @@
+"""Shared dependencies for API routes."""
+import pandas as pd
+import numpy as np
+from typing import Optional, Dict
+from utils.data_loader import ModelDataLoader
+from utils.embeddings import ModelEmbedder
+from utils.dimensionality_reduction import DimensionReducer
+from utils.graph_embeddings import GraphEmbedder
+
+# Global state (initialized in startup) - these are module-level variables
+# that will be updated by main.py during startup
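+# Import this module itself (e.g. "import api.dependencies as deps") and read attributes at
+# call time; "from api.dependencies import df" would bind the initial None and never see updates.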
+data_loader = ModelDataLoader()
+embedder: Optional[ModelEmbedder] = None
+graph_embedder: Optional[GraphEmbedder] = None
+reducer: Optional[DimensionReducer] = None
+df: Optional[pd.DataFrame] = None
+embeddings: Optional[np.ndarray] = None
+graph_embeddings_dict: Optional[Dict[str, np.ndarray]] = None
+combined_embeddings: Optional[np.ndarray] = None
+reduced_embeddings: Optional[np.ndarray] = None
+reduced_embeddings_graph: Optional[np.ndarray] = None
+cluster_labels: Optional[np.ndarray] = None
+
diff --git a/backend/api/main.py b/backend/api/main.py
index 106b009ab38b4976fd0e9d36b885c899c6573f85..884e92852f48cd0a1465db49243eed30e4a7f463 100644
--- a/backend/api/main.py
+++ b/backend/api/main.py
@@ -1,202 +1,216 @@
-"""
-FastAPI backend for serving model data to React/Visx frontend.
-"""
import sys
import os
 backend_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
 if backend_dir not in sys.path:
     sys.path.insert(0, backend_dir)
+import pickle
+import tempfile
+import logging
+from typing import Optional, List, Dict
+from datetime import datetime, timedelta
+import pandas as pd
+import numpy as np
+import httpx
from fastapi import FastAPI, HTTPException, Query, BackgroundTasks, Request
from fastapi.middleware.cors import CORSMiddleware
from fastapi.middleware.gzip import GZipMiddleware
from fastapi.responses import FileResponse, JSONResponse
from fastapi.exceptions import RequestValidationError
from starlette.exceptions import HTTPException as StarletteHTTPException
-from typing import Optional, List, Dict
-import pandas as pd
-import numpy as np
from pydantic import BaseModel
from umap import UMAP
-import tempfile
-import traceback
-import httpx
from utils.data_loader import ModelDataLoader
from utils.embeddings import ModelEmbedder
from utils.dimensionality_reduction import DimensionReducer
from utils.network_analysis import ModelNetworkBuilder
+from utils.graph_embeddings import GraphEmbedder
from services.model_tracker import get_tracker
-from services.model_tracker_improved import get_improved_tracker
from services.arxiv_api import extract_arxiv_ids, fetch_arxiv_papers
+from core.config import settings
+from core.exceptions import DataNotLoadedError, EmbeddingsNotReadyError
+from models.schemas import ModelPoint
+from utils.family_tree import calculate_family_depths
+import api.dependencies as deps
+from api.routes import models, stats, clusters
+
+# Alias for backward compatibility with existing routes.
+# data_loader is a plain object, so binding it at import time is safe; mutable state
+# (df, embeddings, ...) must be read via deps.* or the module-level aliases refreshed in startup.
+data_loader = deps.data_loader
+
-app = FastAPI(title="HF Model Ecosystem API")
+logger = logging.getLogger(__name__)
+
+app = FastAPI(title="HF Model Ecosystem API", version="2.0.0")
app.add_middleware(GZipMiddleware, minimum_size=1000)
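+
+# Reused by the exception handlers below so error responses still include CORS headers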
+CORS_HEADERS = {
+ "Access-Control-Allow-Origin": "*",
+ "Access-Control-Allow-Methods": "*",
+ "Access-Control-Allow-Headers": "*",
+}
+
@app.exception_handler(Exception)
async def global_exception_handler(request: Request, exc: Exception):
- """Global exception handler that ensures CORS headers are included even on errors."""
- import traceback
- error_detail = str(exc)
- traceback_str = traceback.format_exc()
- import sys
- sys.stderr.write(f"Unhandled exception: {error_detail}\n{traceback_str}\n")
+ logger.exception("Unhandled exception", exc_info=exc)
return JSONResponse(
status_code=500,
- content={"detail": error_detail, "error": "Internal server error"},
- headers={
- "Access-Control-Allow-Origin": "*",
- "Access-Control-Allow-Methods": "*",
- "Access-Control-Allow-Headers": "*",
- }
+ content={"detail": "Internal server error"},
+ headers=CORS_HEADERS,
)
@app.exception_handler(StarletteHTTPException)
async def http_exception_handler(request: Request, exc: StarletteHTTPException):
- """HTTP exception handler with CORS headers."""
return JSONResponse(
status_code=exc.status_code,
content={"detail": exc.detail},
- headers={
- "Access-Control-Allow-Origin": "*",
- "Access-Control-Allow-Methods": "*",
- "Access-Control-Allow-Headers": "*",
- }
+ headers=CORS_HEADERS,
)
@app.exception_handler(RequestValidationError)
async def validation_exception_handler(request: Request, exc: RequestValidationError):
- """Validation exception handler with CORS headers."""
return JSONResponse(
status_code=422,
content={"detail": exc.errors()},
- headers={
- "Access-Control-Allow-Origin": "*",
- "Access-Control-Allow-Methods": "*",
- "Access-Control-Allow-Headers": "*",
- }
+ headers=CORS_HEADERS,
)
-# CORS middleware for React frontend
-# Update allow_origins with your Netlify URL in production
-# Note: Add your specific Netlify URL after deployment
-FRONTEND_URL = os.getenv("FRONTEND_URL", "http://localhost:3000")
-# Allow all origins for development (restrict in production)
-ALLOW_ALL_ORIGINS = os.getenv("ALLOW_ALL_ORIGINS", "true").lower() == "true"
-if ALLOW_ALL_ORIGINS:
+if settings.ALLOW_ALL_ORIGINS:
app.add_middleware(
CORSMiddleware,
- allow_origins=["*"], # Allow all origins in development
- allow_credentials=False, # Must be False when allow_origins is ["*"]
+ allow_origins=["*"],
+ allow_credentials=False,
allow_methods=["*"],
allow_headers=["*"],
)
else:
app.add_middleware(
CORSMiddleware,
- allow_origins=[
- "http://localhost:3000", # Local development
- FRONTEND_URL, # Production frontend URL
- # Add your Netlify URL here after deployment, e.g.:
- # "https://your-app-name.netlify.app",
- ],
+ allow_origins=["http://localhost:3000", settings.FRONTEND_URL],
allow_credentials=True,
allow_methods=["*"],
allow_headers=["*"],
)
-data_loader = ModelDataLoader()
-embedder: Optional[ModelEmbedder] = None
-reducer: Optional[DimensionReducer] = None
-df: Optional[pd.DataFrame] = None
-embeddings: Optional[np.ndarray] = None
-reduced_embeddings: Optional[np.ndarray] = None
-cluster_labels: Optional[np.ndarray] = None # Cached cluster assignments
-
-
-class FilterParams(BaseModel):
- min_downloads: int = 0
- min_likes: int = 0
- search_query: Optional[str] = None
- libraries: Optional[List[str]] = None
- pipeline_tags: Optional[List[str]] = None
-
-
-class ModelPoint(BaseModel):
- model_id: str
- x: float
- y: float
- z: float # 3D coordinate
- library_name: Optional[str]
- pipeline_tag: Optional[str]
- downloads: int
- likes: int
- trending_score: Optional[float]
- tags: Optional[str]
- parent_model: Optional[str] = None
- licenses: Optional[str] = None
- family_depth: Optional[int] = None # Generation depth in family tree (0 = root)
- cluster_id: Optional[int] = None # Cluster assignment for visualization
+# Include routers
+app.include_router(models.router)
+app.include_router(stats.router)
+app.include_router(clusters.router)
@app.on_event("startup")
async def startup_event():
- """Initialize data and models on startup with caching."""
- global df, embedder, reducer, embeddings, reduced_embeddings
+    # Shared state is written to the deps module; module-level aliases are refreshed at the end of startup
- import os
backend_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
root_dir = os.path.dirname(backend_dir)
cache_dir = os.path.join(root_dir, "cache")
os.makedirs(cache_dir, exist_ok=True)
embeddings_cache = os.path.join(cache_dir, "embeddings.pkl")
+ graph_embeddings_cache = os.path.join(cache_dir, "graph_embeddings.pkl")
+ combined_embeddings_cache = os.path.join(cache_dir, "combined_embeddings.pkl")
reduced_cache_umap = os.path.join(cache_dir, "reduced_umap_3d.pkl")
+ reduced_cache_umap_graph = os.path.join(cache_dir, "reduced_umap_3d_graph.pkl")
reducer_cache_umap = os.path.join(cache_dir, "reducer_umap_3d.pkl")
+ reducer_cache_umap_graph = os.path.join(cache_dir, "reducer_umap_3d_graph.pkl")
- sample_size_env = os.getenv("SAMPLE_SIZE")
- if sample_size_env is None:
- sample_size = None
+ sample_size = settings.get_sample_size()
+ if sample_size:
+ logger.info(f"Loading limited dataset: {sample_size} models (SAMPLE_SIZE={sample_size})")
else:
- sample_size = int(sample_size_env)
- if sample_size == 0:
- sample_size = None
- df = data_loader.load_data(sample_size=sample_size)
- df = data_loader.preprocess_for_embedding(df)
-
- if 'model_id' in df.columns:
- df.set_index('model_id', drop=False, inplace=True)
+ logger.info("No SAMPLE_SIZE set, loading full dataset")
+
+ deps.df = deps.data_loader.load_data(sample_size=sample_size)
+ deps.df = deps.data_loader.preprocess_for_embedding(deps.df)
+
+ if 'model_id' in deps.df.columns:
+ deps.df.set_index('model_id', drop=False, inplace=True)
for col in ['downloads', 'likes']:
- if col in df.columns:
- df[col] = pd.to_numeric(df[col], errors='coerce').fillna(0).astype(int)
+ if col in deps.df.columns:
+ deps.df[col] = pd.to_numeric(deps.df[col], errors='coerce').fillna(0).astype(int)
- embedder = ModelEmbedder()
+ deps.embedder = ModelEmbedder()
+ # Load or generate text embeddings
if os.path.exists(embeddings_cache):
try:
- embeddings = embedder.load_embeddings(embeddings_cache)
+ deps.embeddings = deps.embedder.load_embeddings(embeddings_cache)
+ except (IOError, pickle.UnpicklingError, EOFError) as e:
+ logger.warning(f"Failed to load cached embeddings: {e}")
+ deps.embeddings = None
+
+ if deps.embeddings is None:
+ texts = deps.df['combined_text'].tolist()
+ deps.embeddings = deps.embedder.generate_embeddings(texts, batch_size=128)
+ deps.embedder.save_embeddings(deps.embeddings, embeddings_cache)
+
+ # Initialize graph embedder and generate graph embeddings (optional, lazy-loaded)
+ if settings.USE_GRAPH_EMBEDDINGS:
+ try:
+ deps.graph_embedder = GraphEmbedder()
+ logger.info("Building family graph for graph embeddings...")
+ graph = deps.graph_embedder.build_family_graph(deps.df)
+
+ if os.path.exists(graph_embeddings_cache):
+ try:
+ deps.graph_embeddings_dict = deps.graph_embedder.load_embeddings(graph_embeddings_cache)
+ logger.info(f"Loaded cached graph embeddings for {len(deps.graph_embeddings_dict)} models")
+ except (IOError, pickle.UnpicklingError, EOFError) as e:
+ logger.warning(f"Failed to load cached graph embeddings: {e}")
+ deps.graph_embeddings_dict = None
+
+ if deps.graph_embeddings_dict is None or len(deps.graph_embeddings_dict) == 0:
+ logger.info("Generating graph embeddings (this may take a while)...")
+ deps.graph_embeddings_dict = deps.graph_embedder.generate_graph_embeddings(graph, workers=4)
+ if deps.graph_embeddings_dict:
+ deps.graph_embedder.save_embeddings(deps.graph_embeddings_dict, graph_embeddings_cache)
+ logger.info(f"Generated graph embeddings for {len(deps.graph_embeddings_dict)} models")
+
+ # Combine text and graph embeddings
+ if deps.graph_embeddings_dict and len(deps.graph_embeddings_dict) > 0:
+ model_ids = deps.df['model_id'].astype(str).tolist()
+ if os.path.exists(combined_embeddings_cache):
+ try:
+ with open(combined_embeddings_cache, 'rb') as f:
+ deps.combined_embeddings = pickle.load(f)
+ logger.info("Loaded cached combined embeddings")
+ except (IOError, pickle.UnpicklingError, EOFError) as e:
+ logger.warning(f"Failed to load cached combined embeddings: {e}")
+ deps.combined_embeddings = None
+
+ if deps.combined_embeddings is None:
+ logger.info("Combining text and graph embeddings...")
+ deps.combined_embeddings = deps.graph_embedder.combine_embeddings(
+ deps.embeddings, deps.graph_embeddings_dict, model_ids,
+ text_weight=0.7, graph_weight=0.3
+ )
+ with open(combined_embeddings_cache, 'wb') as f:
+ pickle.dump(deps.combined_embeddings, f)
+ logger.info("Combined embeddings saved")
except Exception as e:
- embeddings = None
-
- if embeddings is None:
- texts = df['combined_text'].tolist()
- embeddings = embedder.generate_embeddings(texts, batch_size=128)
- embedder.save_embeddings(embeddings, embeddings_cache)
+ logger.warning(f"Graph embeddings not available: {e}. Continuing with text-only embeddings.")
+ deps.graph_embedder = None
+ deps.graph_embeddings_dict = None
+ deps.combined_embeddings = None
- reducer = DimensionReducer(method="umap", n_components=3)
+ # Initialize reducer for text embeddings
+ deps.reducer = DimensionReducer(method="umap", n_components=3)
if os.path.exists(reduced_cache_umap) and os.path.exists(reducer_cache_umap):
try:
- import pickle
with open(reduced_cache_umap, 'rb') as f:
- reduced_embeddings = pickle.load(f)
- reducer.load_reducer(reducer_cache_umap)
- except Exception as e:
- reduced_embeddings = None
-
- if reduced_embeddings is None:
- reducer.reducer = UMAP(
+ deps.reduced_embeddings = pickle.load(f)
+ deps.reducer.load_reducer(reducer_cache_umap)
+ except (IOError, pickle.UnpicklingError, EOFError) as e:
+ logger.warning(f"Failed to load cached reduced embeddings: {e}")
+ deps.reduced_embeddings = None
+
+ if deps.reduced_embeddings is None:
+ deps.reducer.reducer = UMAP(
n_components=3,
n_neighbors=30,
min_dist=0.3,
@@ -206,61 +220,57 @@ async def startup_event():
low_memory=True,
spread=1.5
)
- reduced_embeddings = reducer.fit_transform(embeddings)
- import pickle
+ deps.reduced_embeddings = deps.reducer.fit_transform(deps.embeddings)
with open(reduced_cache_umap, 'wb') as f:
- pickle.dump(reduced_embeddings, f)
- reducer.save_reducer(reducer_cache_umap)
-
-
-def calculate_family_depths(df: pd.DataFrame) -> Dict[str, int]:
- """
- Calculate family tree depth for each model.
- Returns a dictionary mapping model_id to depth (0 = root, 1 = first generation, etc.)
- """
- depths = {}
- visited = set()
+ pickle.dump(deps.reduced_embeddings, f)
+ deps.reducer.save_reducer(reducer_cache_umap)
- def get_depth(model_id: str) -> int:
- if model_id in depths:
- return depths[model_id]
- if model_id in visited:
- # Circular reference, treat as root
- depths[model_id] = 0
- return 0
+ # Initialize reducer for graph-aware embeddings if available
+ if deps.combined_embeddings is not None:
+ reducer_graph = DimensionReducer(method="umap", n_components=3)
- visited.add(model_id)
-
- if model_id not in df.index:
- depths[model_id] = 0
- return 0
-
- parent_id = df.loc[model_id].get('parent_model')
- if parent_id and pd.notna(parent_id) and str(parent_id) != 'nan' and str(parent_id) != '':
- parent_id_str = str(parent_id)
- if parent_id_str in df.index:
- depth = get_depth(parent_id_str) + 1
- else:
- depth = 0 # Parent not in dataset, treat as root
- else:
- depth = 0 # No parent, this is a root
+ if os.path.exists(reduced_cache_umap_graph) and os.path.exists(reducer_cache_umap_graph):
+ try:
+ with open(reduced_cache_umap_graph, 'rb') as f:
+ deps.reduced_embeddings_graph = pickle.load(f)
+ reducer_graph.load_reducer(reducer_cache_umap_graph)
+ except (IOError, pickle.UnpicklingError, EOFError) as e:
+ logger.warning(f"Failed to load cached graph-aware reduced embeddings: {e}")
+ deps.reduced_embeddings_graph = None
- depths[model_id] = depth
- return depth
-
- for model_id in df.index:
- if model_id not in depths:
- visited = set() # Reset for each tree
- get_depth(model_id)
+ if deps.reduced_embeddings_graph is None:
+ reducer_graph.reducer = UMAP(
+ n_components=3,
+ n_neighbors=30,
+ min_dist=0.3,
+ metric='cosine',
+ random_state=42,
+ n_jobs=-1,
+ low_memory=True,
+ spread=1.5
+ )
+ deps.reduced_embeddings_graph = reducer_graph.fit_transform(deps.combined_embeddings)
+ with open(reduced_cache_umap_graph, 'wb') as f:
+ pickle.dump(deps.reduced_embeddings_graph, f)
+ reducer_graph.save_reducer(reducer_cache_umap_graph)
+ logger.info("Graph-aware embeddings reduced and cached")
- return depths
+    # Refresh module-level aliases so routes that still reference bare names see the loaded state
+    global df, embedder, graph_embedder, reducer, embeddings
+    global graph_embeddings_dict, combined_embeddings, reduced_embeddings, reduced_embeddings_graph
+    df = deps.df
+    embedder = deps.embedder
+    graph_embedder = deps.graph_embedder
+    reducer = deps.reducer
+    embeddings = deps.embeddings
+    graph_embeddings_dict = deps.graph_embeddings_dict
+    combined_embeddings = deps.combined_embeddings
+    reduced_embeddings = deps.reduced_embeddings
+    reduced_embeddings_graph = deps.reduced_embeddings_graph
+
+
def compute_clusters(reduced_embeddings: np.ndarray, n_clusters: int = 50) -> np.ndarray:
- """
- Compute clusters using KMeans on reduced embeddings.
- Returns cluster labels for each point.
- """
from sklearn.cluster import KMeans
n_samples = len(reduced_embeddings)
@@ -268,8 +278,7 @@ def compute_clusters(reduced_embeddings: np.ndarray, n_clusters: int = 50) -> np
n_clusters = max(1, n_samples // 10)
kmeans = KMeans(n_clusters=n_clusters, random_state=42, n_init=10)
- cluster_labels = kmeans.fit_predict(reduced_embeddings)
- return cluster_labels
+ return kmeans.fit_predict(reduced_embeddings)
@app.get("/")
@@ -284,24 +293,16 @@ async def get_models(
search_query: Optional[str] = Query(None),
color_by: str = Query("library_name"),
size_by: str = Query("downloads"),
- max_points: Optional[int] = Query(None), # Optional limit (None = all points)
- projection_method: str = Query("umap"), # umap or tsne
- base_models_only: bool = Query(False) # Only show root models (no parent)
+ max_points: Optional[int] = Query(None),
+ projection_method: str = Query("umap"),
+ base_models_only: bool = Query(False),
+ max_hierarchy_depth: Optional[int] = Query(None, ge=0, description="Filter to models at or below this hierarchy depth."),
+ use_graph_embeddings: bool = Query(False, description="Use graph-aware embeddings that respect family tree structure")
):
- """
- Get filtered models with 3D coordinates for visualization.
- Supports multiple projection methods: UMAP or t-SNE.
- If base_models_only=True, only returns root models (models without a parent_model).
-
- Returns a JSON object with:
- - models: List of ModelPoint objects
- - filtered_count: Number of models matching filters (before max_points sampling)
- - returned_count: Number of models actually returned (after max_points sampling)
- """
- global df, embedder, reducer, embeddings, reduced_embeddings
+ if deps.df is None:
+ raise DataNotLoadedError()
- if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+    # Bind local snapshots of shared state so later reassignments stay function-local
+    df = deps.df
+    embeddings = deps.embeddings
+    reduced_embeddings = deps.reduced_embeddings
+    combined_embeddings = deps.combined_embeddings
+    reduced_embeddings_graph = deps.reduced_embeddings_graph
+    reducer = deps.reducer
# Filter data
filtered_df = data_loader.filter_data(
@@ -321,7 +322,12 @@ async def get_models(
(filtered_df['parent_model'].astype(str) == 'nan')
]
- # Store the filtered count BEFORE sampling
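+    # Keep only models whose family-tree depth is <= max_hierarchy_depth (0 = root)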
+ if max_hierarchy_depth is not None:
+ family_depths = calculate_family_depths(df)
+ filtered_df = filtered_df[
+ filtered_df['model_id'].astype(str).map(lambda x: family_depths.get(x, 0) <= max_hierarchy_depth)
+ ]
+
filtered_count = len(filtered_df)
if len(filtered_df) == 0:
@@ -332,42 +338,53 @@ async def get_models(
}
if max_points is not None and len(filtered_df) > max_points:
- # Use stratified sampling to preserve distribution of important attributes
- # Sample proportionally from different libraries/pipelines for better representation
if 'library_name' in filtered_df.columns and filtered_df['library_name'].notna().any():
- # Stratified sampling by library
- filtered_df = filtered_df.groupby('library_name', group_keys=False).apply(
- lambda x: x.sample(min(len(x), max(1, int(max_points * len(x) / len(filtered_df)))), random_state=42)
- ).reset_index(drop=True)
- # If still too many, random sample the rest
+ # Sample proportionally by library, preserving all columns
+ sampled_dfs = []
+ for lib_name, group in filtered_df.groupby('library_name', group_keys=False):
+ n_samples = max(1, int(max_points * len(group) / len(filtered_df)))
+ sampled_dfs.append(group.sample(min(len(group), n_samples), random_state=42))
+ filtered_df = pd.concat(sampled_dfs, ignore_index=True)
if len(filtered_df) > max_points:
- filtered_df = filtered_df.sample(n=max_points, random_state=42)
+ filtered_df = filtered_df.sample(n=max_points, random_state=42).reset_index(drop=True)
+ else:
+ filtered_df = filtered_df.reset_index(drop=True)
else:
- filtered_df = filtered_df.sample(n=max_points, random_state=42)
-
- if embeddings is None:
- raise HTTPException(status_code=503, detail="Embeddings not loaded")
+ filtered_df = filtered_df.sample(n=max_points, random_state=42).reset_index(drop=True)
- if reduced_embeddings is None or (reducer and reducer.method != projection_method.lower()):
- import os
+ # Determine which embeddings to use
+ if use_graph_embeddings and combined_embeddings is not None:
+ current_embeddings = combined_embeddings
+ current_reduced = reduced_embeddings_graph
+ embedding_type = "graph-aware"
+ else:
+ if embeddings is None:
+ raise EmbeddingsNotReadyError()
+ current_embeddings = embeddings
+ current_reduced = reduced_embeddings
+ embedding_type = "text-only"
+
+ # Handle reduced embeddings loading/generation
+ if current_reduced is None or (reducer and reducer.method != projection_method.lower()):
backend_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
root_dir = os.path.dirname(backend_dir)
cache_dir = os.path.join(root_dir, "cache")
- reduced_cache = os.path.join(cache_dir, f"reduced_{projection_method.lower()}_3d.pkl")
- reducer_cache = os.path.join(cache_dir, f"reducer_{projection_method.lower()}_3d.pkl")
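+        # Graph-aware projections are cached separately via the "_graph" suffix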
+ cache_suffix = "_graph" if use_graph_embeddings and combined_embeddings is not None else ""
+ reduced_cache = os.path.join(cache_dir, f"reduced_{projection_method.lower()}_3d{cache_suffix}.pkl")
+ reducer_cache = os.path.join(cache_dir, f"reducer_{projection_method.lower()}_3d{cache_suffix}.pkl")
if os.path.exists(reduced_cache) and os.path.exists(reducer_cache):
try:
- import pickle
with open(reduced_cache, 'rb') as f:
- reduced_embeddings = pickle.load(f)
+ current_reduced = pickle.load(f)
if reducer is None or reducer.method != projection_method.lower():
reducer = DimensionReducer(method=projection_method.lower(), n_components=3)
reducer.load_reducer(reducer_cache)
- except Exception as e:
- reduced_embeddings = None
+ except (IOError, pickle.UnpicklingError, EOFError) as e:
+ logger.warning(f"Failed to load cached reduced embeddings: {e}")
+ current_reduced = None
- if reduced_embeddings is None:
+ if current_reduced is None:
if reducer is None or reducer.method != projection_method.lower():
reducer = DimensionReducer(method=projection_method.lower(), n_components=3)
if projection_method.lower() == "umap":
@@ -381,52 +398,91 @@ async def get_models(
low_memory=True,
spread=1.5
)
- reduced_embeddings = reducer.fit_transform(embeddings)
- import pickle
+ current_reduced = reducer.fit_transform(current_embeddings)
with open(reduced_cache, 'wb') as f:
- pickle.dump(reduced_embeddings, f)
+ pickle.dump(current_reduced, f)
reducer.save_reducer(reducer_cache)
+
+ # Update global variable
+ if use_graph_embeddings and deps.combined_embeddings is not None:
+ deps.reduced_embeddings_graph = current_reduced
+ else:
+ deps.reduced_embeddings = current_reduced
+
+ # Get indices for filtered data
+ # Use model_id column to map between filtered_df and original df
+ # This is safer than using index positions which can change after filtering
+ filtered_model_ids = filtered_df['model_id'].astype(str).values
- # Get coordinates for filtered data - optimized vectorized approach
- # Map filtered dataframe indices to original dataframe integer positions
- # Since df is indexed by model_id, we need to get the integer positions
+ # Map model_ids to positions in original df
if df.index.name == 'model_id' or 'model_id' in df.index.names:
- # Get integer positions of filtered rows in original dataframe
- # Use vectorized lookup for better performance
- filtered_indices = np.array([df.index.get_loc(idx) for idx in filtered_df.index], dtype=np.int32)
+ # When df is indexed by model_id, use get_loc directly
+ filtered_indices = []
+ for model_id in filtered_model_ids:
+ try:
+ pos = df.index.get_loc(model_id)
+ # Handle both single position and array of positions
+ if isinstance(pos, (int, np.integer)):
+ filtered_indices.append(int(pos))
+                    elif isinstance(pos, slice):
+                        # Duplicate labels in a monotonic index: take the first position
+                        filtered_indices.append(int(pos.start))
+                    elif isinstance(pos, np.ndarray):
+                        # Duplicate labels returned as a boolean mask: take the first True position
+                        filtered_indices.append(int(np.flatnonzero(pos)[0]))
+ except (KeyError, TypeError):
+ continue
+ filtered_indices = np.array(filtered_indices, dtype=np.int32)
else:
- # If using integer index, use directly
- filtered_indices = filtered_df.index.values.astype(np.int32)
-
- # Use advanced indexing for faster access
- filtered_reduced = reduced_embeddings[filtered_indices]
+ # When df is not indexed by model_id, find positions by matching model_id column
+ df_model_ids = df['model_id'].astype(str).values
+ model_id_to_pos = {mid: pos for pos, mid in enumerate(df_model_ids)}
+ filtered_indices = np.array([
+ model_id_to_pos[mid] for mid in filtered_model_ids
+ if mid in model_id_to_pos
+ ], dtype=np.int32)
+
+ if len(filtered_indices) == 0:
+ return {
+ "models": [],
+ "embedding_type": embedding_type,
+ "filtered_count": filtered_count,
+ "returned_count": 0
+ }
+ filtered_reduced = current_reduced[filtered_indices]
family_depths = calculate_family_depths(df)
- global cluster_labels
- if cluster_labels is None or len(cluster_labels) != len(reduced_embeddings):
- cluster_labels = compute_clusters(reduced_embeddings, n_clusters=min(50, len(reduced_embeddings) // 100))
+    # Cluster over the full reduced embedding matrix; recompute when the cache is missing or stale
+    clustering_embeddings = current_reduced
+    if deps.cluster_labels is None or len(deps.cluster_labels) != len(clustering_embeddings):
+        deps.cluster_labels = compute_clusters(clustering_embeddings, n_clusters=min(50, len(clustering_embeddings) // 100))
-    filtered_clusters = cluster_labels[filtered_indices]
+    # Guard against stale labels before fancy-indexing with df positions
+    if len(deps.cluster_labels) > 0 and int(filtered_indices.max()) < len(deps.cluster_labels):
+        filtered_clusters = deps.cluster_labels[filtered_indices]
+    else:
+        filtered_clusters = np.zeros(len(filtered_indices), dtype=int)
- # Build response with optimized vectorized operations
- # Pre-extract arrays for faster access
model_ids = filtered_df['model_id'].astype(str).values
- library_names = filtered_df['library_name'].values
- pipeline_tags = filtered_df['pipeline_tag'].values
- downloads_arr = filtered_df['downloads'].fillna(0).astype(int).values
- likes_arr = filtered_df['likes'].fillna(0).astype(int).values
- trending_scores = filtered_df.get('trendingScore', pd.Series()).values
- tags_arr = filtered_df.get('tags', pd.Series()).values
- parent_models = filtered_df.get('parent_model', pd.Series()).values
- licenses_arr = filtered_df.get('licenses', pd.Series()).values
-
- # Vectorized coordinate extraction
+ library_names = filtered_df.get('library_name', pd.Series([None] * len(filtered_df))).values
+ pipeline_tags = filtered_df.get('pipeline_tag', pd.Series([None] * len(filtered_df))).values
+ downloads_arr = filtered_df.get('downloads', pd.Series([0] * len(filtered_df))).fillna(0).astype(int).values
+ likes_arr = filtered_df.get('likes', pd.Series([0] * len(filtered_df))).fillna(0).astype(int).values
+ trending_scores = filtered_df.get('trendingScore', pd.Series([None] * len(filtered_df))).values
+ tags_arr = filtered_df.get('tags', pd.Series([None] * len(filtered_df))).values
+ parent_models = filtered_df.get('parent_model', pd.Series([None] * len(filtered_df))).values
+ licenses_arr = filtered_df.get('licenses', pd.Series([None] * len(filtered_df))).values
+ created_at_arr = filtered_df.get('createdAt', pd.Series([None] * len(filtered_df))).values
+
x_coords = filtered_reduced[:, 0].astype(float)
y_coords = filtered_reduced[:, 1].astype(float)
z_coords = filtered_reduced[:, 2].astype(float) if filtered_reduced.shape[1] > 2 else np.zeros(len(filtered_reduced), dtype=float)
-
- # Build models list with optimized operations
models = [
ModelPoint(
model_id=model_ids[idx],
@@ -442,28 +498,42 @@ async def get_models(
parent_model=parent_models[idx] if idx < len(parent_models) and pd.notna(parent_models[idx]) else None,
licenses=licenses_arr[idx] if idx < len(licenses_arr) and pd.notna(licenses_arr[idx]) else None,
family_depth=family_depths.get(model_ids[idx], None),
- cluster_id=int(filtered_clusters[idx]) if idx < len(filtered_clusters) else None
+ cluster_id=int(filtered_clusters[idx]) if idx < len(filtered_clusters) else None,
+ created_at=str(created_at_arr[idx]) if idx < len(created_at_arr) and pd.notna(created_at_arr[idx]) else None
)
for idx in range(len(filtered_df))
]
- return models
+ # Return models with metadata about embedding type
+ return {
+ "models": models,
+ "embedding_type": embedding_type,
+ "filtered_count": filtered_count,
+ "returned_count": len(models)
+ }
@app.get("/api/stats")
async def get_stats():
"""Get dataset statistics."""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
- # Use len(df.index) to handle both regular and indexed DataFrames correctly
total_models = len(df.index) if hasattr(df, 'index') else len(df)
+ # Get unique licenses with counts
+ licenses = {}
+ if 'license' in df.columns:
+ license_counts = df['license'].value_counts().to_dict()
+ licenses = {str(k): int(v) for k, v in license_counts.items() if pd.notna(k) and str(k) != 'nan'}
+
return {
"total_models": total_models,
"unique_libraries": int(df['library_name'].nunique()) if 'library_name' in df.columns else 0,
"unique_pipelines": int(df['pipeline_tag'].nunique()) if 'pipeline_tag' in df.columns else 0,
"unique_task_types": int(df['pipeline_tag'].nunique()) if 'pipeline_tag' in df.columns else 0, # Alias for clarity
+ "unique_licenses": len(licenses),
+ "licenses": licenses, # License name -> count mapping
"avg_downloads": float(df['downloads'].mean()) if 'downloads' in df.columns else 0,
"avg_likes": float(df['likes'].mean()) if 'likes' in df.columns else 0
}
@@ -473,7 +543,7 @@ async def get_stats():
async def get_model_details(model_id: str):
"""Get detailed information about a specific model."""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
model = df[df.get('model_id', '') == model_id]
if len(model) == 0:
@@ -481,11 +551,9 @@ async def get_model_details(model_id: str):
model = model.iloc[0]
- # Extract arXiv IDs from tags
tags_str = str(model.get('tags', '')) if pd.notna(model.get('tags')) else ''
arxiv_ids = extract_arxiv_ids(tags_str)
- # Fetch arXiv papers if any IDs found
papers = []
if arxiv_ids:
papers = await fetch_arxiv_papers(arxiv_ids[:5]) # Limit to 5 papers
@@ -505,6 +573,8 @@ async def get_model_details(model_id: str):
}
+# Clusters endpoint is handled by routes/clusters.py router
+
@app.get("/api/family/stats")
async def get_family_stats():
"""
@@ -512,9 +582,8 @@ async def get_family_stats():
Returns family size distribution, depth statistics, model card length by depth, etc.
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
- # Calculate family sizes
family_sizes = {}
root_models = set()
@@ -528,14 +597,13 @@ async def get_family_stats():
family_sizes[model_id] = 0
else:
parent_id_str = str(parent_id)
- # Find root of this family
root = parent_id_str
visited = set()
while root in df.index and pd.notna(df.loc[root].get('parent_model')):
parent = df.loc[root].get('parent_model')
if pd.isna(parent) or str(parent) == 'nan' or str(parent) == '':
break
- if str(parent) in visited: # Circular reference
+ if str(parent) in visited:
break
visited.add(root)
root = str(parent)
@@ -544,18 +612,15 @@ async def get_family_stats():
family_sizes[root] = 0
family_sizes[root] += 1
- # Count family sizes
size_distribution = {}
for root, size in family_sizes.items():
size_distribution[size] = size_distribution.get(size, 0) + 1
- # Calculate depth statistics
depths = calculate_family_depths(df)
depth_counts = {}
for depth in depths.values():
depth_counts[depth] = depth_counts.get(depth, 0) + 1
- # Calculate model card length by depth
model_card_lengths_by_depth = {}
if 'modelCard' in df.columns:
for idx, row in df.iterrows():
@@ -568,7 +633,6 @@ async def get_family_stats():
model_card_lengths_by_depth[depth] = []
model_card_lengths_by_depth[depth].append(card_length)
- # Calculate statistics for each depth
model_card_stats = {}
for depth, lengths in model_card_lengths_by_depth.items():
if lengths:
@@ -593,99 +657,218 @@ async def get_family_stats():
}
+@app.get("/api/family/path/{model_id}")
+async def get_family_path(
+ model_id: str,
+ target_id: Optional[str] = Query(None, description="Target model ID. If None, returns path to root.")
+):
+ """
+ Get path from model to root or to target model.
+ Returns list of model IDs representing the path.
+ """
+ if df is None:
+ raise DataNotLoadedError()
+
+ model_id_str = str(model_id)
+
+ if df.index.name == 'model_id':
+ if model_id_str not in df.index:
+ raise HTTPException(status_code=404, detail="Model not found")
+ else:
+ model_rows = df[df.get('model_id', '') == model_id_str]
+ if len(model_rows) == 0:
+ raise HTTPException(status_code=404, detail="Model not found")
+
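+    # Walk up the parent chain; "visited" guards against circular parent references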
+ path = [model_id_str]
+ visited = set([model_id_str])
+ current = model_id_str
+
+ if target_id:
+ target_str = str(target_id)
+ if df.index.name == 'model_id':
+ if target_str not in df.index:
+ raise HTTPException(status_code=404, detail="Target model not found")
+
+        while current != target_str:
+ try:
+ if df.index.name == 'model_id':
+ row = df.loc[current]
+ else:
+ rows = df[df.get('model_id', '') == current]
+ if len(rows) == 0:
+ break
+ row = rows.iloc[0]
+
+ parent_id = row.get('parent_model')
+ if parent_id and pd.notna(parent_id):
+ parent_str = str(parent_id)
+ if parent_str == target_str:
+ path.append(parent_str)
+ break
+ if parent_str not in visited:
+ path.append(parent_str)
+ visited.add(parent_str)
+ current = parent_str
+ else:
+ break
+ else:
+ break
+ except (KeyError, IndexError):
+ break
+ else:
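+        # No target: walk to the root, stopping at a model with no parent or on a cycle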
+ while True:
+ try:
+ if df.index.name == 'model_id':
+ row = df.loc[current]
+ else:
+ rows = df[df.get('model_id', '') == current]
+ if len(rows) == 0:
+ break
+ row = rows.iloc[0]
+
+ parent_id = row.get('parent_model')
+ if parent_id and pd.notna(parent_id):
+ parent_str = str(parent_id)
+ if parent_str not in visited:
+ path.append(parent_str)
+ visited.add(parent_str)
+ current = parent_str
+ else:
+ break
+ else:
+ break
+ except (KeyError, IndexError):
+ break
+
+ return {
+ "path": path,
+ "source": model_id_str,
+ "target": target_id if target_id else "root",
+ "path_length": len(path) - 1
+ }
+
+
@app.get("/api/family/{model_id}")
-async def get_family_tree(model_id: str, max_depth: int = Query(5, ge=1, le=10)):
+async def get_family_tree(
+ model_id: str,
+ max_depth: Optional[int] = Query(None, ge=1, le=100, description="Maximum depth to traverse. If None, traverses entire tree without limit."),
+ max_depth_filter: Optional[int] = Query(None, ge=0, description="Filter results to models at or below this hierarchy depth.")
+):
"""
Get family tree for a model (ancestors and descendants).
Returns the model, its parent chain, and all children.
+
+ If max_depth is None, traverses the entire family tree without depth limits.
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
-
- # Find the model
- model_row = df[df.get('model_id', '') == model_id]
- if len(model_row) == 0:
- raise HTTPException(status_code=404, detail="Model not found")
-
- family_models = []
- visited = set()
+ raise DataNotLoadedError()
- # Get coordinates for family members
if reduced_embeddings is None:
raise HTTPException(status_code=503, detail="Embeddings not ready")
- # Optimize: create parent_model index for faster lookups
- if 'parent_model' not in df.index.names and 'parent_model' in df.columns:
- # Create a reverse index for faster parent lookups
- parent_index = df[df['parent_model'].notna()].set_index('parent_model', drop=False, append=True)
+ model_id_str = str(model_id)
- def get_ancestors(current_id: str, depth: int):
- """Recursively get parent chain - optimized with index lookup."""
- if depth <= 0 or current_id in visited:
+ if df.index.name == 'model_id':
+ if model_id_str not in df.index:
+ raise HTTPException(status_code=404, detail="Model not found")
+ model_lookup = df.loc
+ else:
+ model_rows = df[df.get('model_id', '') == model_id_str]
+ if len(model_rows) == 0:
+ raise HTTPException(status_code=404, detail="Model not found")
+ model_lookup = lambda x: df[df.get('model_id', '') == x]
+
+    from utils.network_analysis import _get_all_parents
+
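+    # Build a reverse index: parent model id -> child model ids, across all relationship types
+    # (finetune, quantized, adapter, merge, and plain parent_model)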
+ children_index: Dict[str, List[str]] = {}
+
+ for idx, row in df.iterrows():
+ model_id_from_row = str(row.get('model_id', idx))
+ all_parents = _get_all_parents(row)
+
+ for rel_type, parent_list in all_parents.items():
+ for parent_str in parent_list:
+ if parent_str not in children_index:
+ children_index[parent_str] = []
+ children_index[parent_str].append(model_id_from_row)
+
+ visited = set()
+
+ def get_ancestors(current_id: str, depth: Optional[int]):
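+        # depth=None means unlimited traversal; otherwise stop once the depth budget is exhausted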
+ if current_id in visited:
+ return
+ if depth is not None and depth <= 0:
return
visited.add(current_id)
- # Use index lookup if available, otherwise fallback to query
- if 'model_id' in df.index.names or df.index.name == 'model_id':
- try:
- model = df.loc[[current_id]]
- except KeyError:
- return
- else:
- model = df[df.get('model_id', '') == current_id]
- if len(model) == 0:
- return
- model = model.iloc[[0]]
-
- parent_id = model.iloc[0].get('parent_model')
-
- if parent_id and pd.notna(parent_id) and str(parent_id) != 'nan':
- get_ancestors(str(parent_id), depth - 1)
+ try:
+ if df.index.name == 'model_id':
+ row = df.loc[current_id]
+ else:
+ rows = model_lookup(current_id)
+ if len(rows) == 0:
+ return
+ row = rows.iloc[0]
+
+ all_parents = _get_all_parents(row)
+ for rel_type, parent_list in all_parents.items():
+ for parent_str in parent_list:
+ if parent_str != 'nan' and parent_str != '':
+ next_depth = depth - 1 if depth is not None else None
+ get_ancestors(parent_str, next_depth)
+ except (KeyError, IndexError):
+ return
- def get_descendants(current_id: str, depth: int):
- """Recursively get all children - optimized with index lookup."""
- if depth <= 0 or current_id in visited:
+ def get_descendants(current_id: str, depth: Optional[int]):
+ if current_id in visited:
+ return
+ if depth is not None and depth <= 0:
return
visited.add(current_id)
- # Use optimized parent lookup
- if 'parent_model' in df.columns:
- children = df[df['parent_model'] == current_id]
- # Use vectorized iteration
- child_ids = children['model_id'].dropna().astype(str).unique()
- for child_id in child_ids:
- if child_id not in visited:
- get_descendants(child_id, depth - 1)
-
- # Get ancestors (parents)
- get_ancestors(model_id, max_depth)
-
- # Get descendants (children)
- visited = set() # Reset for descendants
- get_descendants(model_id, max_depth)
-
- # Add the root model
- visited.add(model_id)
-
- # Get all family members with coordinates - optimized
- if 'model_id' in df.index.names or df.index.name == 'model_id':
- # Use index lookup if available
+ children = children_index.get(current_id, [])
+ for child_id in children:
+ if child_id not in visited:
+ next_depth = depth - 1 if depth is not None else None
+ get_descendants(child_id, next_depth)
+
+ get_ancestors(model_id_str, max_depth)
+ visited = set()
+ get_descendants(model_id_str, max_depth)
+ visited.add(model_id_str)
+
+ if df.index.name == 'model_id':
try:
family_df = df.loc[list(visited)]
except KeyError:
- # Fallback to isin if some IDs not in index
- family_df = df[df.get('model_id', '').isin(visited)]
+ missing = [v for v in visited if v not in df.index]
+ if missing:
+ logger.warning(f"Some family members not found in index: {missing}")
+ family_df = df.loc[[v for v in visited if v in df.index]]
else:
family_df = df[df.get('model_id', '').isin(visited)]
- family_indices = family_df.index.values # Use values instead of tolist() for speed
+ if len(family_df) == 0:
+ raise HTTPException(status_code=404, detail="Family tree data not available")
+
+    # Convert index labels (model ids) to integer positions before indexing the embedding matrix
+    if df.index.name == 'model_id':
+        family_indices = np.array([df.index.get_loc(v) for v in family_df.index], dtype=np.int64)
+    else:
+        family_indices = family_df.index.values.astype(np.int64)
+    if len(family_indices) > len(reduced_embeddings):
+        raise HTTPException(status_code=503, detail="Embedding indices mismatch")
+
     family_reduced = reduced_embeddings[family_indices]
- # Build family tree structure - optimized with vectorized operations
family_map = {}
+    depths = calculate_family_depths(df)
     for idx, (i, row) in enumerate(family_df.iterrows()):
- model_id_val = str(row.get('model_id', 'Unknown'))
- parent_id = row.get('parent_model') if pd.notna(row.get('parent_model')) else None
+ model_id_val = str(row.get('model_id', i))
+ parent_id = row.get('parent_model')
+ parent_id_str = str(parent_id) if parent_id and pd.notna(parent_id) else None
+
+ model_depth = depths.get(model_id_val, 0)
+
+ if max_depth_filter is not None and model_depth > max_depth_filter:
+ continue
family_map[model_id_val] = {
"model_id": model_id_val,
@@ -696,12 +879,12 @@ async def get_family_tree(model_id: str, max_depth: int = Query(5, ge=1, le=10))
"pipeline_tag": str(row.get('pipeline_tag')) if pd.notna(row.get('pipeline_tag')) else None,
"downloads": int(row.get('downloads', 0)) if pd.notna(row.get('downloads')) else 0,
"likes": int(row.get('likes', 0)) if pd.notna(row.get('likes')) else 0,
- "parent_model": str(parent_id) if parent_id else None,
+ "parent_model": parent_id_str,
"licenses": str(row.get('licenses')) if pd.notna(row.get('licenses')) else None,
+ "family_depth": model_depth,
"children": []
}
- # Build tree structure
root_models = []
for model_id_val, model_data in family_map.items():
parent_id = model_data["parent_model"]
@@ -711,7 +894,7 @@ async def get_family_tree(model_id: str, max_depth: int = Query(5, ge=1, le=10))
root_models.append(model_id_val)
return {
- "root_model": model_id,
+ "root_model": model_id_str,
"family": list(family_map.values()),
"family_map": family_map,
"root_models": root_models
@@ -720,7 +903,9 @@ async def get_family_tree(model_id: str, max_depth: int = Query(5, ge=1, le=10))
@app.get("/api/search")
async def search_models(
- query: str = Query(..., min_length=1),
+    q: Optional[str] = Query(None, min_length=1),
+    query: Optional[str] = Query(None, min_length=1),
+ limit: int = Query(20, ge=1, le=100),
graph_aware: bool = Query(False),
include_neighbors: bool = Query(True)
):
@@ -729,47 +914,79 @@ async def search_models(
Enhanced with graph-aware search option that includes network relationships.
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
+
+    # Support both 'q' and 'query' query parameters; at least one is required
+    search_query = query or q
+    if not search_query:
+        raise HTTPException(status_code=422, detail="Provide a search term via 'q' or 'query'")
if graph_aware:
- # Use graph-aware search
try:
network_builder = ModelNetworkBuilder(df)
- # Build network for top models (for performance)
top_models = network_builder.get_top_models_by_field(n=1000)
model_ids = [mid for mid, _ in top_models]
graph = network_builder.build_cooccurrence_network(model_ids, cooccurrence_method='combined')
results = network_builder.search_graph_aware(
- query=query,
+ query=search_query,
graph=graph,
- max_results=20,
+ max_results=limit,
include_neighbors=include_neighbors
)
- return {"results": results, "search_type": "graph_aware"}
- except Exception as e:
- pass
+ return {"results": results, "search_type": "graph_aware", "query": search_query}
+ except (ValueError, KeyError, AttributeError) as e:
+ logger.warning(f"Graph-aware search failed, falling back to basic search: {e}")
+
+ query_lower = search_query.lower()
+
+ # Enhanced search: search model_id, org, tags, library, pipeline
+ model_id_col = df.get('model_id', '').astype(str).str.lower()
+ library_col = df.get('library_name', '').astype(str).str.lower()
+ pipeline_col = df.get('pipeline_tag', '').astype(str).str.lower()
+ tags_col = df.get('tags', '').astype(str).str.lower()
+ license_col = df.get('license', '').astype(str).str.lower()
+
+ # Extract org from model_id
+ org_col = model_id_col.str.split('/').str[0]
+
+ # Multi-field search
+ mask = (
+ model_id_col.str.contains(query_lower, na=False) |
+ org_col.str.contains(query_lower, na=False) |
+ library_col.str.contains(query_lower, na=False) |
+ pipeline_col.str.contains(query_lower, na=False) |
+ tags_col.str.contains(query_lower, na=False) |
+ license_col.str.contains(query_lower, na=False)
+ )
- query_lower = query.lower()
- matches = df[
- df.get('model_id', '').astype(str).str.lower().str.contains(query_lower, na=False)
- ].head(20) # Limit to 20 results
+ matches = df[mask].head(limit)
results = []
for _, row in matches.iterrows():
+ model_id = str(row.get('model_id', ''))
+ org = model_id.split('/')[0] if '/' in model_id else ''
+
+ # Get coordinates if available
+ x = float(row.get('x', 0.0)) if 'x' in row else None
+ y = float(row.get('y', 0.0)) if 'y' in row else None
+ z = float(row.get('z', 0.0)) if 'z' in row else None
+
results.append({
- "model_id": row.get('model_id'),
- "title": row.get('model_id', '').split('/')[-1] if '/' in str(row.get('model_id', '')) else str(row.get('model_id', '')),
- "library_name": row.get('library_name'),
- "pipeline_tag": row.get('pipeline_tag'),
+ "model_id": model_id,
+ "x": x,
+ "y": y,
+ "z": z,
+ "org": org,
+ "library": row.get('library_name'),
+ "pipeline": row.get('pipeline_tag'),
+ "license": row.get('license') if pd.notna(row.get('license')) else None,
"downloads": int(row.get('downloads', 0)),
"likes": int(row.get('likes', 0)),
"parent_model": row.get('parent_model') if pd.notna(row.get('parent_model')) else None,
"match_type": "direct"
})
- return {"results": results, "search_type": "basic"}
+ return {"results": results, "search_type": "basic", "query": search_query}
@app.get("/api/similar/{model_id}")
@@ -778,12 +995,12 @@ async def get_similar_models(model_id: str, k: int = Query(10, ge=1, le=50)):
Get k-nearest neighbors of a model based on embedding similarity.
Returns similar models with distance scores.
"""
- global df, embedder, embeddings, reduced_embeddings
-
- if df is None or embeddings is None:
+ if deps.df is None or deps.embeddings is None:
raise HTTPException(status_code=503, detail="Data not loaded")
- # Find the model - optimized with index lookup
+ df = deps.df
+ embeddings = deps.embeddings
+
if 'model_id' in df.index.names or df.index.name == 'model_id':
try:
model_row = df.loc[[model_id]]
@@ -797,16 +1014,11 @@ async def get_similar_models(model_id: str, k: int = Query(10, ge=1, le=50)):
model_idx = model_row.index[0]
model_embedding = embeddings[model_idx]
- # Calculate cosine similarity to all other models - optimized
from sklearn.metrics.pairwise import cosine_similarity
- # Use vectorized operations for better performance
model_embedding_2d = model_embedding.reshape(1, -1)
similarities = cosine_similarity(model_embedding_2d, embeddings)[0]
- # Get top k similar models (excluding itself) - use argpartition for speed
- # argpartition is faster than full sort for top-k
top_k_indices = np.argpartition(similarities, -k-1)[-k-1:-1]
- # Sort only the top k (much faster than sorting all)
top_k_indices = top_k_indices[np.argsort(similarities[top_k_indices])][::-1]
similar_models = []
@@ -817,7 +1029,7 @@ async def get_similar_models(model_id: str, k: int = Query(10, ge=1, le=50)):
similar_models.append({
"model_id": row.get('model_id', 'Unknown'),
"similarity": float(similarities[idx]),
- "distance": float(1 - similarities[idx]), # Convert similarity to distance
+ "distance": float(1 - similarities[idx]),
"library_name": row.get('library_name'),
"pipeline_tag": row.get('pipeline_tag'),
"downloads": int(row.get('downloads', 0)),
@@ -843,11 +1055,12 @@ async def get_models_by_semantic_similarity(
Returns models with their similarity scores and coordinates.
Useful for exploring the embedding space around a specific model.
"""
- global df, embedder, embeddings, reduced_embeddings
-
- if df is None or embeddings is None:
+ if deps.df is None or deps.embeddings is None:
raise HTTPException(status_code=503, detail="Data not loaded")
+    df = deps.df
+    embeddings = deps.embeddings
+    reduced_embeddings = deps.reduced_embeddings
+
# Find the query model
if 'model_id' in df.index.names or df.index.name == 'model_id':
try:
@@ -863,7 +1076,6 @@ async def get_models_by_semantic_similarity(
query_embedding = embeddings[model_idx]
- # Filter by downloads/likes first for performance
filtered_df = data_loader.filter_data(
df=df,
min_downloads=min_downloads,
@@ -873,32 +1085,26 @@ async def get_models_by_semantic_similarity(
pipeline_tags=None
)
- # Get indices of filtered models
if df.index.name == 'model_id' or 'model_id' in df.index.names:
filtered_indices = [df.index.get_loc(idx) for idx in filtered_df.index]
filtered_indices = np.array(filtered_indices, dtype=int)
else:
filtered_indices = filtered_df.index.values.astype(int)
- # Calculate similarities only for filtered models
filtered_embeddings = embeddings[filtered_indices]
from sklearn.metrics.pairwise import cosine_similarity
query_embedding_2d = query_embedding.reshape(1, -1)
similarities = cosine_similarity(query_embedding_2d, filtered_embeddings)[0]
- # Get top k similar models
top_k_local_indices = np.argpartition(similarities, -k)[-k:]
top_k_local_indices = top_k_local_indices[np.argsort(similarities[top_k_local_indices])][::-1]
- # Get reduced embeddings for visualization
if reduced_embeddings is None:
raise HTTPException(status_code=503, detail="Reduced embeddings not ready")
- # Map back to original indices
top_k_original_indices = filtered_indices[top_k_local_indices]
top_k_reduced = reduced_embeddings[top_k_original_indices]
- # Build response
similar_models = []
for i, orig_idx in enumerate(top_k_original_indices):
row = df.iloc[orig_idx]
@@ -935,11 +1141,12 @@ async def get_distance(
"""
Calculate distance/similarity between two models.
"""
- global df, embedder, embeddings
-
- if df is None or embeddings is None:
+ if deps.df is None or deps.embeddings is None:
raise HTTPException(status_code=503, detail="Data not loaded")
+ df = deps.df
+ embeddings = deps.embeddings
+
# Find both models - optimized with index lookup
if 'model_id' in df.index.names or df.index.name == 'model_id':
try:
@@ -976,7 +1183,7 @@ async def export_models(model_ids: List[str]):
Export selected models as JSON with full metadata.
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
# Optimized export with index lookup
if 'model_id' in df.index.names or df.index.name == 'model_id':
@@ -991,7 +1198,6 @@ async def export_models(model_ids: List[str]):
if len(exported) == 0:
return {"models": []}
- # Use list comprehension for faster building
models = [
{
"model_id": str(row.get('model_id', '')),
@@ -1029,12 +1235,10 @@ async def get_cooccurrence_network(
Returns network graph data suitable for visualization.
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
try:
network_builder = ModelNetworkBuilder(df)
-
- # Get top models by field
top_models = network_builder.get_top_models_by_field(
library=library,
pipeline_tag=pipeline_tag,
@@ -1051,14 +1255,11 @@ async def get_cooccurrence_network(
}
model_ids = [mid for mid, _ in top_models]
-
- # Build co-occurrence network
graph = network_builder.build_cooccurrence_network(
model_ids=model_ids,
cooccurrence_method=cooccurrence_method
)
- # Convert to JSON-serializable format
nodes = []
for node_id, attrs in graph.nodes(data=True):
nodes.append({
@@ -1086,45 +1287,70 @@ async def get_cooccurrence_network(
"links": links,
"statistics": stats
}
-
- except Exception as e:
+ except (ValueError, KeyError, AttributeError) as e:
+ logger.error(f"Error building network: {e}", exc_info=True)
raise HTTPException(status_code=500, detail=f"Error building network: {str(e)}")
@app.get("/api/network/family/{model_id}")
async def get_family_network(
model_id: str,
- max_depth: int = Query(5, ge=1, le=10)
+ max_depth: Optional[int] = Query(None, ge=1, le=100, description="Maximum depth to traverse. If None, traverses entire tree without limit."),
+ edge_types: Optional[str] = Query(None, description="Comma-separated list of edge types to include (finetune,quantized,adapter,merge,parent). If None, includes all types."),
+ include_edge_attributes: bool = Query(True, description="Whether to include edge attributes (change in likes, downloads, etc.)")
):
"""
Build family tree network for a model (directed graph).
- Returns network graph data showing parent-child relationships.
+ Returns network graph data showing parent-child relationships with multiple relationship types.
+ Supports filtering by edge type (finetune, quantized, adapter, merge, parent).
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
try:
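+        # Parse the optional comma-separated edge-type filter (e.g. "finetune,quantized")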
+ filter_types = None
+ if edge_types:
+ filter_types = [t.strip() for t in edge_types.split(',') if t.strip()]
+
network_builder = ModelNetworkBuilder(df)
graph = network_builder.build_family_tree_network(
root_model_id=model_id,
- max_depth=max_depth
+ max_depth=max_depth,
+ include_edge_attributes=include_edge_attributes,
+ filter_edge_types=filter_types
)
- # Convert to JSON-serializable format
nodes = []
for node_id, attrs in graph.nodes(data=True):
nodes.append({
"id": node_id,
"title": attrs.get('title', node_id),
- "freq": attrs.get('freq', 0)
+ "freq": attrs.get('freq', 0),
+ "likes": attrs.get('likes', 0),
+ "downloads": attrs.get('downloads', 0),
+ "library": attrs.get('library', ''),
+ "pipeline": attrs.get('pipeline', '')
})
links = []
- for source, target in graph.edges():
- links.append({
+ for source, target, edge_attrs in graph.edges(data=True):
+ link_data = {
"source": source,
- "target": target
- })
+ "target": target,
+ "edge_type": edge_attrs.get('edge_type'),
+ "edge_types": edge_attrs.get('edge_types', [])
+ }
+
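+                # Optional per-edge deltas (likes, downloads, createdAt) supplied by the network builder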
+ if include_edge_attributes:
+ link_data.update({
+ "change_in_likes": edge_attrs.get('change_in_likes'),
+ "percentage_change_in_likes": edge_attrs.get('percentage_change_in_likes'),
+ "change_in_downloads": edge_attrs.get('change_in_downloads'),
+ "percentage_change_in_downloads": edge_attrs.get('percentage_change_in_downloads'),
+ "change_in_createdAt_days": edge_attrs.get('change_in_createdAt_days')
+ })
+
+ links.append(link_data)
stats = network_builder.get_network_statistics(graph)
@@ -1134,8 +1360,8 @@ async def get_family_network(
"statistics": stats,
"root_model": model_id
}
-
- except Exception as e:
+ except (ValueError, KeyError, AttributeError) as e:
+ logger.error(f"Error building family network: {e}", exc_info=True)
raise HTTPException(status_code=500, detail=f"Error building family network: {str(e)}")
@@ -1150,11 +1376,10 @@ async def get_model_neighbors(
Similar to graph database queries for finding connected nodes.
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
try:
network_builder = ModelNetworkBuilder(df)
- # Build network for top models (for performance)
top_models = network_builder.get_top_models_by_field(n=1000)
model_ids = [mid for mid, _ in top_models]
graph = network_builder.build_cooccurrence_network(model_ids, cooccurrence_method='combined')
@@ -1171,8 +1396,8 @@ async def get_model_neighbors(
"neighbors": neighbors,
"count": len(neighbors)
}
-
- except Exception as e:
+ except (ValueError, KeyError, AttributeError) as e:
+ logger.error(f"Error finding neighbors: {e}", exc_info=True)
raise HTTPException(status_code=500, detail=f"Error finding neighbors: {str(e)}")
@@ -1187,7 +1412,7 @@ async def find_path_between_models(
Similar to graph database path queries.
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
try:
network_builder = ModelNetworkBuilder(df)
@@ -1235,7 +1460,7 @@ async def search_by_cooccurrence(
Similar to graph database queries for co-assignment patterns.
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
try:
network_builder = ModelNetworkBuilder(df)
@@ -1272,7 +1497,7 @@ async def get_model_relationships(
Similar to graph database relationship queries.
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
try:
network_builder = ModelNetworkBuilder(df)
@@ -1297,32 +1522,57 @@ async def get_model_relationships(
async def get_current_model_count(
use_cache: bool = Query(True),
force_refresh: bool = Query(False),
- use_dataset_snapshot: bool = Query(False)
+ use_dataset_snapshot: bool = Query(False),
+ use_models_page: bool = Query(True)
):
"""
Get the current number of models on Hugging Face Hub.
- Fetches live data from the Hub API or uses dataset snapshot (faster but may be outdated).
+ Uses multiple strategies: models page scraping (fastest), dataset snapshot, or API.
Query Parameters:
use_cache: Use cached results if available (default: True)
force_refresh: Force refresh even if cache is valid (default: False)
- use_dataset_snapshot: Use dataset snapshot instead of API (faster, default: False)
+ use_dataset_snapshot: Use dataset snapshot for breakdowns (default: False)
+ use_models_page: Try to get count from HF models page first (default: True)
"""
try:
+ tracker = get_tracker()
+
if use_dataset_snapshot:
- # Use improved tracker with dataset snapshot (like ai-ecosystem repo)
- tracker = get_improved_tracker()
- count_data = tracker.get_count_from_dataset_snapshot()
+ count_data = tracker.get_count_from_models_page()
if count_data is None:
- # Fallback to API if dataset unavailable
- count_data = tracker.get_current_model_count(use_cache=use_cache, force_refresh=force_refresh)
+ count_data = tracker.get_current_model_count(use_models_page=False)
+ else:
+ try:
+ from utils.data_loader import ModelDataLoader
+ data_loader = ModelDataLoader()
+ df = data_loader.load_data(sample_size=10000)
+ library_counts = {}
+ pipeline_counts = {}
+
+ for _, row in df.iterrows():
+ if pd.notna(row.get('library_name')):
+ lib = str(row.get('library_name'))
+ library_counts[lib] = library_counts.get(lib, 0) + 1
+ if pd.notna(row.get('pipeline_tag')):
+ pipeline = str(row.get('pipeline_tag'))
+ pipeline_counts[pipeline] = pipeline_counts.get(pipeline, 0) + 1
+
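+                # Extrapolate breakdowns from the 10k-row sample up to the scraped total count.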
+ if len(df) > 0 and count_data["total_models"] > len(df):
+ scale_factor = count_data["total_models"] / len(df)
+ library_counts = {k: int(v * scale_factor) for k, v in library_counts.items()}
+ pipeline_counts = {k: int(v * scale_factor) for k, v in pipeline_counts.items()}
+
+ count_data["models_by_library"] = library_counts
+ count_data["models_by_pipeline"] = pipeline_counts
+ except Exception as e:
+ logger.warning(f"Could not get breakdowns from dataset: {e}")
else:
- # Use improved tracker with API (has caching)
- tracker = get_improved_tracker()
- count_data = tracker.get_current_model_count(use_cache=use_cache, force_refresh=force_refresh)
+ count_data = tracker.get_current_model_count(use_models_page=use_models_page)
return count_data
except Exception as e:
+ logger.error(f"Error fetching model count: {e}", exc_info=True)
raise HTTPException(status_code=500, detail=f"Error fetching model count: {str(e)}")
@@ -1343,7 +1593,7 @@ async def get_historical_model_counts(
try:
from datetime import datetime
- tracker = get_improved_tracker()
+ tracker = get_tracker()
start = None
end = None
@@ -1373,7 +1623,7 @@ async def get_historical_model_counts(
async def get_latest_model_count():
"""Get the most recently recorded model count from database."""
try:
- tracker = get_improved_tracker()
+ tracker = get_tracker()
latest = tracker.get_latest_count()
if latest is None:
raise HTTPException(status_code=404, detail="No model counts recorded yet")
@@ -1397,16 +1647,14 @@ async def record_model_count(
use_dataset_snapshot: Use dataset snapshot instead of API (faster, default: False)
"""
try:
- tracker = get_improved_tracker()
+ tracker = get_tracker()
- # Fetch and record in background to avoid blocking
def record():
if use_dataset_snapshot:
count_data = tracker.get_count_from_dataset_snapshot()
if count_data:
tracker.record_count(count_data, source="dataset_snapshot")
else:
- # Fallback to API
count_data = tracker.get_current_model_count(use_cache=False)
tracker.record_count(count_data, source="api")
else:
@@ -1433,7 +1681,7 @@ async def get_growth_stats(days: int = Query(7, ge=1, le=365)):
days: Number of days to analyze
"""
try:
- tracker = get_improved_tracker()
+ tracker = get_tracker()
stats = tracker.get_growth_stats(days)
return stats
except Exception as e:
@@ -1455,12 +1703,11 @@ async def export_network_graphml(
Similar to Open Syllabus graph export functionality.
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
try:
network_builder = ModelNetworkBuilder(df)
- # Get top models by field
top_models = network_builder.get_top_models_by_field(
library=library,
pipeline_tag=pipeline_tag,
@@ -1473,29 +1720,24 @@ async def export_network_graphml(
raise HTTPException(status_code=404, detail="No models found matching criteria")
model_ids = [mid for mid, _ in top_models]
-
- # Build co-occurrence network
graph = network_builder.build_cooccurrence_network(
model_ids=model_ids,
cooccurrence_method=cooccurrence_method
)
- # Create temporary file
with tempfile.NamedTemporaryFile(mode='w', suffix='.graphml', delete=False) as tmp_file:
tmp_path = tmp_file.name
network_builder.export_graphml(graph, tmp_path)
- # Schedule cleanup after response is sent
background_tasks.add_task(os.unlink, tmp_path)
- # Return file for download
return FileResponse(
tmp_path,
media_type='application/xml',
filename=f'network_{cooccurrence_method}_{n}_models.graphml'
)
-
- except Exception as e:
+ except (ValueError, KeyError, AttributeError, IOError) as e:
+ logger.error(f"Error exporting network: {e}", exc_info=True)
raise HTTPException(status_code=500, detail=f"Error exporting network: {str(e)}")
@@ -1506,7 +1748,7 @@ async def get_model_papers(model_id: str):
Extracts arXiv IDs from model tags and fetches paper information.
"""
if df is None:
- raise HTTPException(status_code=503, detail="Data not loaded")
+ raise DataNotLoadedError()
model = df[df.get('model_id', '') == model_id]
if len(model) == 0:
@@ -1535,36 +1777,131 @@ async def get_model_papers(model_id: str):
}
+@app.get("/api/models/minimal.bin")
+async def get_minimal_binary():
+ """
+ Serve the binary minimal dataset file.
+ This is optimized for fast client-side loading.
+ """
+ backend_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+ root_dir = os.path.dirname(backend_dir)
+ binary_path = os.path.join(root_dir, "cache", "binary", "embeddings.bin")
+
+ if not os.path.exists(binary_path):
+ raise HTTPException(status_code=404, detail="Binary dataset not found. Run export_binary.py first.")
+
+ return FileResponse(
+ binary_path,
+ media_type="application/octet-stream",
+ headers={
+ "Content-Disposition": "attachment; filename=embeddings.bin",
+ "Cache-Control": "public, max-age=3600"
+ }
+ )
+
+
+@app.get("/api/models/model_ids.json")
+async def get_model_ids_json():
+ """Serve the model IDs JSON file."""
+ backend_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+ root_dir = os.path.dirname(backend_dir)
+ json_path = os.path.join(root_dir, "cache", "binary", "model_ids.json")
+
+ if not os.path.exists(json_path):
+ raise HTTPException(status_code=404, detail="Model IDs file not found.")
+
+ return FileResponse(
+ json_path,
+ media_type="application/json",
+ headers={"Cache-Control": "public, max-age=3600"}
+ )
+
+
+@app.get("/api/models/metadata.json")
+async def get_metadata_json():
+ """Serve the metadata JSON file with lookup tables."""
+ backend_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+ root_dir = os.path.dirname(backend_dir)
+ json_path = os.path.join(root_dir, "cache", "binary", "metadata.json")
+
+ if not os.path.exists(json_path):
+ raise HTTPException(status_code=404, detail="Metadata file not found.")
+
+ return FileResponse(
+ json_path,
+ media_type="application/json",
+ headers={"Cache-Control": "public, max-age=3600"}
+ )
+
+
@app.get("/api/model/{model_id}/files")
async def get_model_files(model_id: str, branch: str = Query("main")):
"""
Get file tree for a model from Hugging Face.
Proxies the request to avoid CORS issues.
+ Returns a flat list of files with path and size information.
"""
+ if not model_id or not model_id.strip():
+ raise HTTPException(status_code=400, detail="Invalid model ID")
+
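+    # Try the requested branch first, then fall back to the other common default branch name.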
+ branches_to_try = [branch, "main", "master"] if branch not in ["main", "master"] else [branch, "main" if branch == "master" else "master"]
+
try:
- # Try main branch first, then master
- branches_to_try = [branch, "main", "master"] if branch not in ["main", "master"] else [branch, "main" if branch == "master" else "master"]
-
- async with httpx.AsyncClient(timeout=10.0) as client:
+ async with httpx.AsyncClient(timeout=15.0) as client:
for branch_name in branches_to_try:
try:
url = f"https://huggingface.co/api/models/{model_id}/tree/{branch_name}"
response = await client.get(url)
+
if response.status_code == 200:
- return response.json()
- except Exception:
+ data = response.json()
+ # Ensure we return an array
+ if isinstance(data, list):
+ return data
+ elif isinstance(data, dict) and 'tree' in data:
+ return data['tree']
+ else:
+ return []
+
+ elif response.status_code == 404:
+ # Try next branch
+ continue
+ else:
+ logger.warning(f"Unexpected status {response.status_code} for {url}")
+ continue
+
+ except httpx.HTTPStatusError as e:
+ if e.response.status_code == 404:
+ continue # Try next branch
+ logger.warning(f"HTTP error for branch {branch_name}: {e}")
+ continue
+ except httpx.HTTPError as e:
+ logger.warning(f"HTTP error for branch {branch_name}: {e}")
continue
- raise HTTPException(status_code=404, detail="File tree not found for this model")
+ # All branches failed
+ raise HTTPException(
+ status_code=404,
+ detail=f"File tree not found for model '{model_id}'. The model may not exist or may not have any files."
+ )
+
except httpx.TimeoutException:
- raise HTTPException(status_code=504, detail="Request to Hugging Face timed out")
+ raise HTTPException(
+ status_code=504,
+ detail="Request to Hugging Face timed out. Please try again later."
+ )
+ except HTTPException:
+ raise # Re-raise HTTP exceptions
except Exception as e:
- raise HTTPException(status_code=500, detail=f"Error fetching file tree: {str(e)}")
+ logger.error(f"Error fetching file tree: {e}", exc_info=True)
+ raise HTTPException(
+ status_code=500,
+ detail=f"Error fetching file tree: {str(e)}"
+ )
if __name__ == "__main__":
import uvicorn
- # Use PORT environment variable for cloud platforms (Railway, Render, Heroku)
port = int(os.getenv("PORT", 8000))
uvicorn.run(app, host="0.0.0.0", port=port)
diff --git a/backend/api/routes/__init__.py b/backend/api/routes/__init__.py
new file mode 100644
index 0000000000000000000000000000000000000000..d3b07a869e15406215660fc24e61e49a1cb246ff
--- /dev/null
+++ b/backend/api/routes/__init__.py
@@ -0,0 +1,6 @@
+"""
+API route modules.
+"""
+from . import models, stats, clusters
+
+__all__ = ['models', 'stats', 'clusters']
diff --git a/backend/api/routes/clusters.py b/backend/api/routes/clusters.py
new file mode 100644
index 0000000000000000000000000000000000000000..a54280b8f2bb8aa7e80758d4d1a39db0e81e9a4d
--- /dev/null
+++ b/backend/api/routes/clusters.py
@@ -0,0 +1,102 @@
+"""
+API routes for cluster endpoints.
+"""
+from fastapi import APIRouter
+import numpy as np
+import pandas as pd
+from core.exceptions import DataNotLoadedError
+import api.dependencies as deps
+
+router = APIRouter(prefix="/api", tags=["clusters"])
+
+
+@router.get("/clusters")
+async def get_clusters():
+ """Get all clusters with metadata and hierarchical labels."""
+ if deps.df is None:
+ raise DataNotLoadedError()
+
+ # Import cluster_labels from models route
+ from api.routes.models import cluster_labels
+
+ # If clusters haven't been computed yet, return empty list instead of error
+ # This allows the frontend to work while data is still loading
+ if cluster_labels is None:
+ return {"clusters": []}
+
+ df = deps.df
+
+ # Generate hierarchical labels for clusters
+ clusters = []
+ unique_clusters = np.unique(cluster_labels)
+
+ for cluster_id in unique_clusters:
+ cluster_mask = cluster_labels == cluster_id
+ cluster_models = df[cluster_mask]
+
+ if len(cluster_models) == 0:
+ continue
+
+ # Generate hierarchical label
+ library_counts = cluster_models['library_name'].value_counts()
+ pipeline_counts = cluster_models['pipeline_tag'].value_counts()
+
+ # Determine primary domain/library
+ if len(library_counts) > 0:
+ primary_lib = library_counts.index[0]
+ if primary_lib and pd.notna(primary_lib):
+ if 'transformers' in str(primary_lib).lower():
+ domain = "NLP"
+ elif 'diffusers' in str(primary_lib).lower():
+ domain = "Multimodal"
+ elif 'timm' in str(primary_lib).lower():
+ domain = "Computer Vision"
+ else:
+ domain = str(primary_lib).replace('_', ' ').title()
+ else:
+ domain = "Other"
+ else:
+ domain = "Other"
+
+ # Determine subdomain from pipeline
+ if len(pipeline_counts) > 0:
+ primary_pipeline = pipeline_counts.index[0]
+ if primary_pipeline and pd.notna(primary_pipeline):
+ subdomain = str(primary_pipeline).replace('-', ' ').replace('_', ' ').title()
+ else:
+ subdomain = "General"
+ else:
+ subdomain = "General"
+
+ # Determine characteristics
+ characteristics = []
+ model_ids_lower = cluster_models['model_id'].astype(str).str.lower()
+ if model_ids_lower.str.contains('gpt', na=False).any():
+ characteristics.append("GPT-based")
+ if cluster_models['parent_model'].notna().any():
+ characteristics.append("Fine-tuned")
+ if not characteristics:
+ characteristics.append("Base Models")
+
+ char_str = "; ".join(characteristics)
+ label = f"{domain} — {subdomain} ({char_str})"
+
+ # Generate color (use consistent colors based on cluster_id)
+ colors = [
+ "#1f77b4", "#ff7f0e", "#2ca02c", "#d62728", "#9467bd",
+ "#8c564b", "#e377c2", "#7f7f7f", "#bcbd22", "#17becf"
+ ]
+ color = colors[cluster_id % len(colors)]
+
+ clusters.append({
+ "cluster_id": int(cluster_id),
+ "cluster_label": label,
+ "count": int(len(cluster_models)),
+ "color": color
+ })
+
+ # Sort by count descending
+ clusters.sort(key=lambda x: x["count"], reverse=True)
+
+ return {"clusters": clusters}
+
diff --git a/backend/api/routes/models.py b/backend/api/routes/models.py
new file mode 100644
index 0000000000000000000000000000000000000000..652553fa8ceea430d2f3b2fdeb735197d61d326e
--- /dev/null
+++ b/backend/api/routes/models.py
@@ -0,0 +1,247 @@
+"""
+API routes for model data endpoints.
+"""
+from typing import Optional
+from fastapi import APIRouter, Query, HTTPException
+import numpy as np
+import pandas as pd
+import pickle
+import os
+import logging
+
+from umap import UMAP
+from models.schemas import ModelPoint
+from utils.family_tree import calculate_family_depths
+from utils.dimensionality_reduction import DimensionReducer
+from core.exceptions import DataNotLoadedError, EmbeddingsNotReadyError
+import api.dependencies as deps
+
+logger = logging.getLogger(__name__)
+
+router = APIRouter(prefix="/api", tags=["models"])
+
+# Global cluster labels cache (shared across routes)
+cluster_labels = None
+
+
+def compute_clusters(reduced_embeddings: np.ndarray, n_clusters: int = 50) -> np.ndarray:
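+    """Cluster points with KMeans on the reduced embeddings; shrinks n_clusters for small samples."""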
+ from sklearn.cluster import KMeans
+
+ n_samples = len(reduced_embeddings)
+ if n_samples < n_clusters:
+ n_clusters = max(1, n_samples // 10)
+
+ kmeans = KMeans(n_clusters=n_clusters, random_state=42, n_init=10)
+ return kmeans.fit_predict(reduced_embeddings)
+
+
+@router.get("/models")
+async def get_models(
+ min_downloads: int = Query(0),
+ min_likes: int = Query(0),
+ search_query: Optional[str] = Query(None),
+ color_by: str = Query("library_name"),
+ size_by: str = Query("downloads"),
+ max_points: Optional[int] = Query(None),
+ projection_method: str = Query("umap"),
+ base_models_only: bool = Query(False),
+ max_hierarchy_depth: Optional[int] = Query(None, ge=0, description="Filter to models at or below this hierarchy depth."),
+ use_graph_embeddings: bool = Query(False, description="Use graph-aware embeddings that respect family tree structure")
+):
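+    """
+    Return filtered model points with 3D coordinates for client-side rendering.
+    Applies download/like/search filters, optional stratified sampling down to max_points,
+    and serves either text-only or graph-aware embeddings depending on the request.
+    """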
+ if deps.df is None:
+ raise DataNotLoadedError()
+
+ df = deps.df
+ data_loader = deps.data_loader
+
+ # Filter data
+ filtered_df = data_loader.filter_data(
+ df=df,
+ min_downloads=min_downloads,
+ min_likes=min_likes,
+ search_query=search_query,
+ libraries=None,
+ pipeline_tags=None
+ )
+
+ if base_models_only:
+ if 'parent_model' in filtered_df.columns:
+ filtered_df = filtered_df[
+ filtered_df['parent_model'].isna() |
+ (filtered_df['parent_model'].astype(str).str.strip() == '') |
+ (filtered_df['parent_model'].astype(str) == 'nan')
+ ]
+
+ if max_hierarchy_depth is not None:
+ family_depths = calculate_family_depths(df)
+ filtered_df = filtered_df[
+ filtered_df['model_id'].astype(str).map(lambda x: family_depths.get(x, 0) <= max_hierarchy_depth)
+ ]
+
+ filtered_count = len(filtered_df)
+
+ if len(filtered_df) == 0:
+ return {
+ "models": [],
+ "filtered_count": 0,
+ "returned_count": 0
+ }
+
+ if max_points is not None and len(filtered_df) > max_points:
+ if 'library_name' in filtered_df.columns and filtered_df['library_name'].notna().any():
+ sampled_dfs = []
+ for lib_name, group in filtered_df.groupby('library_name', group_keys=False):
+ n_samples = max(1, int(max_points * len(group) / len(filtered_df)))
+ sampled_dfs.append(group.sample(min(len(group), n_samples), random_state=42))
+ filtered_df = pd.concat(sampled_dfs, ignore_index=True)
+ if len(filtered_df) > max_points:
+ filtered_df = filtered_df.sample(n=max_points, random_state=42).reset_index(drop=True)
+ else:
+ filtered_df = filtered_df.reset_index(drop=True)
+ else:
+ filtered_df = filtered_df.sample(n=max_points, random_state=42).reset_index(drop=True)
+
+ # Determine which embeddings to use
+ if use_graph_embeddings and deps.combined_embeddings is not None:
+ current_embeddings = deps.combined_embeddings
+ current_reduced = deps.reduced_embeddings_graph
+ embedding_type = "graph-aware"
+ else:
+ if deps.embeddings is None:
+ raise EmbeddingsNotReadyError()
+ current_embeddings = deps.embeddings
+ current_reduced = deps.reduced_embeddings
+ embedding_type = "text-only"
+
+ # Handle reduced embeddings loading/generation
+ reducer = deps.reducer
+ if current_reduced is None or (reducer and reducer.method != projection_method.lower()):
+ backend_dir = os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+ root_dir = os.path.dirname(backend_dir)
+ cache_dir = os.path.join(root_dir, "cache")
+ cache_suffix = "_graph" if use_graph_embeddings and deps.combined_embeddings is not None else ""
+ reduced_cache = os.path.join(cache_dir, f"reduced_{projection_method.lower()}_3d{cache_suffix}.pkl")
+ reducer_cache = os.path.join(cache_dir, f"reducer_{projection_method.lower()}_3d{cache_suffix}.pkl")
+
+ if os.path.exists(reduced_cache) and os.path.exists(reducer_cache):
+ try:
+ with open(reduced_cache, 'rb') as f:
+ current_reduced = pickle.load(f)
+ if reducer is None or reducer.method != projection_method.lower():
+ reducer = DimensionReducer(method=projection_method.lower(), n_components=3)
+ reducer.load_reducer(reducer_cache)
+ except (IOError, pickle.UnpicklingError, EOFError) as e:
+ logger.warning(f"Failed to load cached reduced embeddings: {e}")
+ current_reduced = None
+
+ if current_reduced is None:
+ if reducer is None or reducer.method != projection_method.lower():
+ reducer = DimensionReducer(method=projection_method.lower(), n_components=3)
+ if projection_method.lower() == "umap":
+ reducer.reducer = UMAP(
+ n_components=3,
+ n_neighbors=30,
+ min_dist=0.3,
+ metric='cosine',
+ random_state=42,
+ n_jobs=-1,
+ low_memory=True,
+ spread=1.5
+ )
+ current_reduced = reducer.fit_transform(current_embeddings)
+ with open(reduced_cache, 'wb') as f:
+ pickle.dump(current_reduced, f)
+ reducer.save_reducer(reducer_cache)
+
+ # Update global variable
+ if use_graph_embeddings and deps.combined_embeddings is not None:
+ deps.reduced_embeddings_graph = current_reduced
+ else:
+ deps.reduced_embeddings = current_reduced
+
+ # Get indices for filtered data
+ filtered_model_ids = filtered_df['model_id'].astype(str).values
+
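+    # df may be indexed by model_id (positional lookup via get_loc) or keep model_id as a
+    # plain column (dict lookup); both branches produce row positions into current_reduced.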
+ if df.index.name == 'model_id' or 'model_id' in df.index.names:
+ filtered_indices = []
+ for model_id in filtered_model_ids:
+ try:
+ pos = df.index.get_loc(model_id)
+ if isinstance(pos, (int, np.integer)):
+ filtered_indices.append(int(pos))
+ elif isinstance(pos, (slice, np.ndarray)):
+ if isinstance(pos, slice):
+ filtered_indices.append(int(pos.start))
+ else:
+ filtered_indices.append(int(pos[0]))
+ except (KeyError, TypeError):
+ continue
+ filtered_indices = np.array(filtered_indices, dtype=np.int32)
+ else:
+ df_model_ids = df['model_id'].astype(str).values
+ model_id_to_pos = {mid: pos for pos, mid in enumerate(df_model_ids)}
+ filtered_indices = np.array([
+ model_id_to_pos[mid] for mid in filtered_model_ids
+ if mid in model_id_to_pos
+ ], dtype=np.int32)
+
+ if len(filtered_indices) == 0:
+ return {
+ "models": [],
+ "embedding_type": embedding_type,
+ "filtered_count": filtered_count,
+ "returned_count": 0
+ }
+
+ filtered_reduced = current_reduced[filtered_indices]
+ family_depths = calculate_family_depths(df)
+
+ global cluster_labels
+ clustering_embeddings = current_reduced
+ if cluster_labels is None or len(cluster_labels) != len(clustering_embeddings):
+        cluster_labels = compute_clusters(clustering_embeddings, n_clusters=max(1, min(50, len(clustering_embeddings) // 100)))
+
+ filtered_clusters = cluster_labels[filtered_indices]
+
+ model_ids = filtered_df['model_id'].astype(str).values
+ library_names = filtered_df.get('library_name', pd.Series([None] * len(filtered_df))).values
+ pipeline_tags = filtered_df.get('pipeline_tag', pd.Series([None] * len(filtered_df))).values
+ downloads_arr = filtered_df.get('downloads', pd.Series([0] * len(filtered_df))).fillna(0).astype(int).values
+ likes_arr = filtered_df.get('likes', pd.Series([0] * len(filtered_df))).fillna(0).astype(int).values
+ trending_scores = filtered_df.get('trendingScore', pd.Series([None] * len(filtered_df))).values
+ tags_arr = filtered_df.get('tags', pd.Series([None] * len(filtered_df))).values
+ parent_models = filtered_df.get('parent_model', pd.Series([None] * len(filtered_df))).values
+ licenses_arr = filtered_df.get('licenses', pd.Series([None] * len(filtered_df))).values
+ created_at_arr = filtered_df.get('createdAt', pd.Series([None] * len(filtered_df))).values
+
+ x_coords = filtered_reduced[:, 0].astype(float)
+ y_coords = filtered_reduced[:, 1].astype(float)
+ z_coords = filtered_reduced[:, 2].astype(float) if filtered_reduced.shape[1] > 2 else np.zeros(len(filtered_reduced), dtype=float)
+ models = [
+ ModelPoint(
+ model_id=model_ids[idx],
+ x=float(x_coords[idx]),
+ y=float(y_coords[idx]),
+ z=float(z_coords[idx]),
+ library_name=library_names[idx] if pd.notna(library_names[idx]) else None,
+ pipeline_tag=pipeline_tags[idx] if pd.notna(pipeline_tags[idx]) else None,
+ downloads=int(downloads_arr[idx]),
+ likes=int(likes_arr[idx]),
+ trending_score=float(trending_scores[idx]) if idx < len(trending_scores) and pd.notna(trending_scores[idx]) else None,
+ tags=tags_arr[idx] if idx < len(tags_arr) and pd.notna(tags_arr[idx]) else None,
+ parent_model=parent_models[idx] if idx < len(parent_models) and pd.notna(parent_models[idx]) else None,
+ licenses=licenses_arr[idx] if idx < len(licenses_arr) and pd.notna(licenses_arr[idx]) else None,
+ family_depth=family_depths.get(model_ids[idx], None),
+ cluster_id=int(filtered_clusters[idx]) if idx < len(filtered_clusters) else None,
+ created_at=str(created_at_arr[idx]) if idx < len(created_at_arr) and pd.notna(created_at_arr[idx]) else None
+ )
+ for idx in range(len(filtered_df))
+ ]
+
+ return {
+ "models": models,
+ "embedding_type": embedding_type,
+ "filtered_count": filtered_count,
+ "returned_count": len(models)
+ }
+
diff --git a/backend/api/routes/stats.py b/backend/api/routes/stats.py
new file mode 100644
index 0000000000000000000000000000000000000000..860cf3ce4bff0f6f09a507de89bf4286bbdfc353
--- /dev/null
+++ b/backend/api/routes/stats.py
@@ -0,0 +1,37 @@
+"""
+API routes for statistics endpoints.
+"""
+from fastapi import APIRouter
+from core.exceptions import DataNotLoadedError
+import api.dependencies as deps
+
+router = APIRouter(prefix="/api", tags=["stats"])
+
+
+@router.get("/stats")
+async def get_stats():
+ """Get dataset statistics."""
+ if deps.df is None:
+ raise DataNotLoadedError()
+
+ df = deps.df
+ total_models = len(df.index) if hasattr(df, 'index') else len(df)
+
+ # Get unique licenses with counts
+ licenses = {}
+ if 'license' in df.columns:
+ import pandas as pd
+ license_counts = df['license'].value_counts().to_dict()
+ licenses = {str(k): int(v) for k, v in license_counts.items() if pd.notna(k) and str(k) != 'nan'}
+
+ return {
+ "total_models": total_models,
+ "unique_libraries": int(df['library_name'].nunique()) if 'library_name' in df.columns else 0,
+ "unique_pipelines": int(df['pipeline_tag'].nunique()) if 'pipeline_tag' in df.columns else 0,
+ "unique_task_types": int(df['pipeline_tag'].nunique()) if 'pipeline_tag' in df.columns else 0,
+ "unique_licenses": len(licenses),
+ "licenses": licenses,
+ "avg_downloads": float(df['downloads'].mean()) if 'downloads' in df.columns else 0,
+ "avg_likes": float(df['likes'].mean()) if 'likes' in df.columns else 0
+ }
+
diff --git a/backend/config/requirements.txt b/backend/config/requirements.txt
index e3fc460ac083eeb1f04d3a75dd2197b054ceba11..8eaf5280322ea510e16ac3585888adff4098f9c3 100644
--- a/backend/config/requirements.txt
+++ b/backend/config/requirements.txt
@@ -11,5 +11,6 @@ huggingface-hub>=0.17.0
schedule>=1.2.0
tqdm>=4.66.0
networkx>=3.0
+node2vec>=0.4.6
httpx>=0.24.0
diff --git a/backend/core/__init__.py b/backend/core/__init__.py
new file mode 100644
index 0000000000000000000000000000000000000000..5e62adb7dc738fd84ba2f2b6464adff697c3fd40
--- /dev/null
+++ b/backend/core/__init__.py
@@ -0,0 +1,2 @@
+"""Core configuration and utilities."""
+
diff --git a/backend/core/config.py b/backend/core/config.py
new file mode 100644
index 0000000000000000000000000000000000000000..6d6be5ca4796f84263b138e672be392078791bac
--- /dev/null
+++ b/backend/core/config.py
@@ -0,0 +1,23 @@
+"""Configuration management."""
+import os
+from typing import Optional
+
+class Settings:
+ """Application settings."""
+ FRONTEND_URL: str = os.getenv("FRONTEND_URL", "http://localhost:3000")
+ ALLOW_ALL_ORIGINS: bool = os.getenv("ALLOW_ALL_ORIGINS", "True").lower() in ("true", "1", "yes")
+ SAMPLE_SIZE: Optional[int] = None
+ USE_GRAPH_EMBEDDINGS: bool = os.getenv("USE_GRAPH_EMBEDDINGS", "false").lower() == "true"
+ PORT: int = int(os.getenv("PORT", 8000))
+
+ @classmethod
+ def get_sample_size(cls) -> Optional[int]:
+ """Get sample size from environment."""
+ sample_size_env = os.getenv("SAMPLE_SIZE")
+ if sample_size_env:
+ sample_size_val = int(sample_size_env)
+ return sample_size_val if sample_size_val > 0 else None
+ return None
+
+settings = Settings()
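+# Consumers are expected to import this singleton, e.g. `from core.config import settings`.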
+
diff --git a/backend/core/exceptions.py b/backend/core/exceptions.py
new file mode 100644
index 0000000000000000000000000000000000000000..a27af9dc314e746f2046d8a86054be76a7858fab
--- /dev/null
+++ b/backend/core/exceptions.py
@@ -0,0 +1,18 @@
+"""Custom exceptions."""
+from fastapi import HTTPException
+
+class ModelNotFoundError(HTTPException):
+ """Model not found exception."""
+ def __init__(self, model_id: str):
+ super().__init__(status_code=404, detail=f"Model not found: {model_id}")
+
+class DataNotLoadedError(HTTPException):
+ """Data not loaded exception."""
+ def __init__(self):
+ super().__init__(status_code=503, detail="Data not loaded")
+
+class EmbeddingsNotReadyError(HTTPException):
+ """Embeddings not ready exception."""
+ def __init__(self):
+ super().__init__(status_code=503, detail="Embeddings not ready")
+
diff --git a/backend/models/__init__.py b/backend/models/__init__.py
new file mode 100644
index 0000000000000000000000000000000000000000..ef80f4c2c943e8b1049df1a8e5bc7092d1e34117
--- /dev/null
+++ b/backend/models/__init__.py
@@ -0,0 +1,2 @@
+"""Data models and schemas."""
+
diff --git a/backend/models/schemas.py b/backend/models/schemas.py
new file mode 100644
index 0000000000000000000000000000000000000000..60dec7be36259a9a470ab3a73d6e540c6c69d740
--- /dev/null
+++ b/backend/models/schemas.py
@@ -0,0 +1,22 @@
+"""Pydantic models for API."""
+from pydantic import BaseModel
+from typing import Optional
+
+class ModelPoint(BaseModel):
+ """Model point in 3D space."""
+ model_id: str
+ x: float
+ y: float
+ z: float
+ library_name: Optional[str]
+ pipeline_tag: Optional[str]
+ downloads: int
+ likes: int
+ trending_score: Optional[float]
+ tags: Optional[str]
+ parent_model: Optional[str] = None
+ licenses: Optional[str] = None
+ family_depth: Optional[int] = None
+ cluster_id: Optional[int] = None
+ created_at: Optional[str] = None # ISO format date string
+
diff --git a/backend/scripts/export_binary.py b/backend/scripts/export_binary.py
new file mode 100644
index 0000000000000000000000000000000000000000..ff710fa9b8b3456f1f27fb9812680c14a8504fcc
--- /dev/null
+++ b/backend/scripts/export_binary.py
@@ -0,0 +1,263 @@
+"""
+Export minimal dataset to binary format for fast client-side loading.
+This creates a compact binary representation optimized for WebGL rendering.
+"""
+import struct
+import json
+import numpy as np
+import pandas as pd
+from pathlib import Path
+import sys
+import os
+
+# Add parent directory to path
+sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+
+from utils.data_loader import ModelDataLoader
+from utils.dimensionality_reduction import DimensionReducer
+from utils.embeddings import ModelEmbedder
+
+
+def calculate_family_depths(df: pd.DataFrame) -> dict:
+ """Calculate depth of each model in its family tree."""
+ depths = {}
+
+ def get_depth(model_id: str, visited: set = None) -> int:
+ if visited is None:
+ visited = set()
+ if model_id in visited:
+ return 0 # Cycle detected
+ visited.add(model_id)
+
+ if model_id in depths:
+ return depths[model_id]
+
+ parent_col = df.get('parent_model', pd.Series([None] * len(df), index=df.index))
+ model_row = df[df['model_id'] == model_id]
+
+ if model_row.empty:
+ depths[model_id] = 0
+ return 0
+
+ parent = model_row.iloc[0].get('parent_model')
+ if pd.isna(parent) or parent == '' or str(parent) == 'nan':
+ depths[model_id] = 0
+ return 0
+
+ parent_depth = get_depth(str(parent), visited.copy())
+ depth = parent_depth + 1
+ depths[model_id] = depth
+ return depth
+
+ for model_id in df['model_id'].unique():
+ if model_id not in depths:
+ get_depth(str(model_id))
+
+ return depths
+
+
+def export_binary_dataset(df: pd.DataFrame, reduced_embeddings: np.ndarray, output_dir: Path):
+ """
+ Export minimal dataset to binary format for fast client-side loading.
+
+ Binary format:
+ - Header (64 bytes): magic, version, counts, lookup table sizes
+ - Domain lookup table (32 bytes per domain)
+ - License lookup table (32 bytes per license)
+    - Model records (17 bytes each, little-endian): x, y, z, domain_id, license_id, family_id, flags
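+
+    A matching reader (a sketch; this mirrors the writer below) can unpack the header with
+    struct.unpack('<5sBIIIIBBH38s', buf[:64]), skip 32 * (num_domains + num_licenses) bytes
+    of lookup tables, and then iterate records with struct.iter_unpack('<fffBBHB', rest).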
+ """
+ output_dir.mkdir(parents=True, exist_ok=True)
+
+ print(f"Exporting {len(df)} models to binary format...")
+
+ # Ensure we have coordinates
+ if 'x' not in df.columns or 'y' not in df.columns:
+ if reduced_embeddings is None or len(reduced_embeddings) != len(df):
+ raise ValueError("Need reduced embeddings to generate coordinates")
+
+ df['x'] = reduced_embeddings[:, 0] if reduced_embeddings.shape[1] > 0 else 0.0
+ df['y'] = reduced_embeddings[:, 1] if reduced_embeddings.shape[1] > 1 else 0.0
+ df['z'] = reduced_embeddings[:, 2] if reduced_embeddings.shape[1] > 2 else 0.0
+
+ # Create lookup tables
+ # Domain = library_name
+ domains = sorted(df['library_name'].dropna().astype(str).unique())
+ domains = [d for d in domains if d and d != 'nan'][:255] # Limit to 255
+
+ # License
+ licenses = sorted(df['license'].dropna().astype(str).unique())
+ licenses = [l for l in licenses if l and l != 'nan'][:255] # Limit to 255
+
+ # Family ID mapping (use parent_model to create family groups)
+ family_depths = calculate_family_depths(df)
+
+ # Create family mapping: group models by root parent
+ def get_root_parent(model_id: str) -> str:
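+        """Walk parent_model links upward to the family root; `visited` guards against cycles."""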
+ visited = set()
+ current = str(model_id)
+        while current not in visited:
+ visited.add(current)
+ model_row = df[df['model_id'] == current]
+ if model_row.empty:
+ return current
+ parent = model_row.iloc[0].get('parent_model')
+ if pd.isna(parent) or parent == '' or str(parent) == 'nan':
+ return current
+ current = str(parent)
+ return current
+
+ root_parents = {}
+ family_counter = 0
+ for model_id in df['model_id'].unique():
+ root = get_root_parent(str(model_id))
+ if root not in root_parents:
+ root_parents[root] = family_counter
+ family_counter += 1
+
+ # Map each model to its family
+ model_to_family = {}
+ for model_id in df['model_id'].unique():
+ root = get_root_parent(str(model_id))
+ model_to_family[str(model_id)] = root_parents.get(root, 65535)
+
+ # Limit families to 65535 (u16 max)
+ if len(root_parents) > 65535:
+ # Use hash-based family IDs
+ import hashlib
+ for model_id in df['model_id'].unique():
+ root = get_root_parent(str(model_id))
+ family_hash = int(hashlib.md5(root.encode()).hexdigest()[:4], 16) % 65535
+ model_to_family[str(model_id)] = family_hash
+
+ # Prepare model records
+ records = []
+ model_ids = []
+
+ for idx, row in df.iterrows():
+ model_id = str(row['model_id'])
+ model_ids.append(model_id)
+
+ # Get coordinates
+ x = float(row.get('x', 0.0))
+ y = float(row.get('y', 0.0))
+ z = float(row.get('z', 0.0))
+
+ # Encode domain (library_name)
+ domain_str = str(row.get('library_name', ''))
+ domain_id = domains.index(domain_str) if domain_str in domains else 255
+
+ # Encode license
+ license_str = str(row.get('license', ''))
+ license_id = licenses.index(license_str) if license_str in licenses else 255
+
+ # Encode family
+ family_id = model_to_family.get(model_id, 65535)
+
+ # Encode flags
+ flags = 0
+ parent = row.get('parent_model')
+ if pd.isna(parent) or parent == '' or str(parent) == 'nan':
+ flags |= 0x01 # is_base_model
+
+ # Check if has children (simple check - could be improved)
+ children = df[df['parent_model'] == model_id]
+ if len(children) > 0:
+ flags |= 0x04 # has_children
+ elif not pd.isna(parent) and parent != '' and str(parent) != 'nan':
+ flags |= 0x02 # has_parent
+
+        # Pack record (17 bytes, little-endian): f32 x, f32 y, f32 z, u8 domain, u8 license, u16 family, u8 flags
+        records.append(struct.pack('<fffBBHB', x, y, z, domain_id, license_id, family_id, flags))
+
+ num_models = len(records)
+
+ # Write binary file
+ with open(output_dir / 'embeddings.bin', 'wb') as f:
+        # Header (exactly 64 bytes): magic(5) + version(1) + four u32 counts(16) + reserved(4) + padding(38)
+        header = struct.pack('<5sBIIIIBBH38s',
+                             b'HFVIZ',                            # magic (5 bytes)
+                             1,                                   # version (1 byte)
+                             num_models,                          # num_models (4 bytes)
+                             len(domains),                        # num_domains (4 bytes)
+                             len(licenses),                       # num_licenses (4 bytes)
+                             len(set(model_to_family.values())),  # num_families (4 bytes)
+                             0,                                   # reserved (1 byte)
+                             0,                                   # reserved (1 byte)
+                             0,                                   # reserved (2 bytes)
+                             b'\x00' * 38)                        # padding (38 bytes)
+ f.write(header)
+
+ # Domain lookup table (32 bytes per domain, null-terminated)
+ for domain in domains:
+ domain_bytes = domain.encode('utf-8')[:31]
+ f.write(domain_bytes.ljust(32, b'\x00'))
+
+ # License lookup table (32 bytes per license)
+ for license in licenses:
+ license_bytes = license.encode('utf-8')[:31]
+ f.write(license_bytes.ljust(32, b'\x00'))
+
+ # Model records
+ f.write(b''.join(records))
+
+ # Write model IDs JSON (separate file for string table)
+ with open(output_dir / 'model_ids.json', 'w') as f:
+ json.dump(model_ids, f)
+
+ # Write metadata JSON
+ metadata = {
+ 'domains': domains,
+ 'licenses': licenses,
+ 'num_models': num_models,
+ 'num_families': len(set(model_to_family.values())),
+ 'version': 1
+ }
+ with open(output_dir / 'metadata.json', 'w') as f:
+ json.dump(metadata, f, indent=2)
+
+ binary_size = (output_dir / 'embeddings.bin').stat().st_size
+ json_size = (output_dir / 'model_ids.json').stat().st_size
+
+ print(f"✓ Exported {num_models} models")
+ print(f"✓ Binary size: {binary_size / 1024 / 1024:.2f} MB")
+ print(f"✓ Model IDs JSON: {json_size / 1024 / 1024:.2f} MB")
+ print(f"✓ Total: {(binary_size + json_size) / 1024 / 1024:.2f} MB")
+ print(f"✓ Domains: {len(domains)}")
+ print(f"✓ Licenses: {len(licenses)}")
+ print(f"✓ Families: {len(set(model_to_family.values()))}")
+
+
+if __name__ == '__main__':
+ import argparse
+
+ parser = argparse.ArgumentParser(description='Export dataset to binary format')
+ parser.add_argument('--output', type=str, default='backend/cache/binary', help='Output directory')
+ parser.add_argument('--sample-size', type=int, default=None, help='Sample size (for testing)')
+ args = parser.parse_args()
+
+ output_dir = Path(args.output)
+
+ # Load data
+ print("Loading dataset...")
+ data_loader = ModelDataLoader()
+ df = data_loader.load_data(sample_size=args.sample_size)
+ df = data_loader.preprocess_for_embedding(df)
+
+ # Generate embeddings and reduce dimensions if needed
+ if 'x' not in df.columns or 'y' not in df.columns:
+ print("Generating embeddings...")
+ embedder = ModelEmbedder()
+ embeddings = embedder.generate_embeddings(df['combined_text'].tolist())
+
+ print("Reducing dimensions...")
+ reducer = DimensionReducer()
+ reduced_embeddings = reducer.reduce_dimensions(embeddings, n_components=3, method='umap')
+ else:
+ reduced_embeddings = None
+
+ # Export
+ export_binary_dataset(df, reduced_embeddings, output_dir)
+ print("Done!")
+
diff --git a/backend/services/model_tracker.py b/backend/services/model_tracker.py
index eb93d3f419492b53d9129237598f0aac88307858..092e59eaaa3d46594ed55085a229c593ec9826b4 100644
--- a/backend/services/model_tracker.py
+++ b/backend/services/model_tracker.py
@@ -5,11 +5,16 @@ Tracks the number of models over time and provides historical data.
import os
import json
import sqlite3
+import logging
+import re
from datetime import datetime, timedelta
from typing import Dict, List, Optional, Tuple
from huggingface_hub import HfApi
import pandas as pd
from pathlib import Path
+import httpx
+
+logger = logging.getLogger(__name__)
class ModelCountTracker:
@@ -34,7 +39,6 @@ class ModelCountTracker:
conn = sqlite3.connect(self.db_path)
cursor = conn.cursor()
- # Create table for model counts
cursor.execute("""
CREATE TABLE IF NOT EXISTS model_counts (
id INTEGER PRIMARY KEY AUTOINCREMENT,
@@ -47,7 +51,6 @@ class ModelCountTracker:
)
""")
- # Create index for faster queries
cursor.execute("""
CREATE INDEX IF NOT EXISTS idx_timestamp
ON model_counts(timestamp)
@@ -56,27 +59,90 @@ class ModelCountTracker:
conn.commit()
conn.close()
- def get_current_model_count(self) -> Dict:
+ def get_count_from_models_page(self) -> Optional[Dict]:
"""
- Fetch current model count from Hugging Face Hub API.
- Uses efficient pagination to get accurate count.
+ Get model count by scraping the Hugging Face models page.
+ Extracts count from the div with class "font-normal text-gray-400" on https://huggingface.co/models
+ or from window.__hf_deferred["numTotalItems"] in the page script.
Returns:
- Dictionary with total count and breakdowns
+ Dictionary with total_models count, or None if extraction fails
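+
+            A successful result looks like (illustrative values only):
+                {"total_models": 2249310, "timestamp": "<ISO timestamp>", "source": "hf_models_page",
+                 "models_by_library": {}, "models_by_pipeline": {}, "models_by_author": {}}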
"""
try:
- # Use pagination to efficiently count models
- # The API returns paginated results, so we iterate through pages
- # For large counts, we sample and extrapolate for speed
+ url = "https://huggingface.co/models"
+ response = httpx.get(url, timeout=10.0, follow_redirects=True)
+ response.raise_for_status()
+
+ html_content = response.text
+
+ deferred_pattern = r'window\.__hf_deferred\["numTotalItems"\]\s*=\s*(\d+);'
+ deferred_matches = re.findall(deferred_pattern, html_content)
+
+ if deferred_matches:
+ total_models = int(deferred_matches[0])
+ logger.info(f"Extracted model count from window.__hf_deferred: {total_models}")
+
+ return {
+ "total_models": total_models,
+ "timestamp": datetime.utcnow().isoformat(),
+ "source": "hf_models_page",
+ "models_by_library": {},
+ "models_by_pipeline": {},
+ "models_by_author": {}
+ }
+            pattern = r'<div[^>]*class="[^"]*font-normal[^"]*text-gray-400[^"]*"[^>]*>([\d,]+)</div>'
+ matches = re.findall(pattern, html_content)
+
+ if matches:
+ count_str = matches[0].replace(',', '')
+ total_models = int(count_str)
+
+ logger.info(f"Extracted model count from div: {total_models}")
+
+ return {
+ "total_models": total_models,
+ "timestamp": datetime.utcnow().isoformat(),
+ "source": "hf_models_page",
+ "models_by_library": {},
+ "models_by_pipeline": {},
+ "models_by_author": {}
+ }
+
+ logger.warning("Could not find model count in HF models page HTML")
+ return None
+
+ except httpx.HTTPError as e:
+ logger.error(f"HTTP error fetching HF models page: {e}", exc_info=True)
+ return None
+ except Exception as e:
+ logger.error(f"Error extracting count from HF models page: {e}", exc_info=True)
+ return None
+
+ def get_current_model_count(self, use_models_page: bool = True) -> Dict:
+ """
+ Fetch current model count from Hugging Face Hub.
+ Uses multiple strategies: models page scraping (fastest), then API enumeration.
+
+ Args:
+ use_models_page: Try to get count from HF models page first (default: True)
+
+ Returns:
+ Dictionary with total count and breakdowns
+ """
+ if use_models_page:
+ page_count = self.get_count_from_models_page()
+ if page_count:
+ return page_count
+
+ try:
total_count = 0
library_counts = {}
pipeline_counts = {}
- page_size = 1000 # Process in batches
- max_pages = 100 # Limit to prevent timeout (can adjust)
- sample_size = 10000 # Sample size for breakdowns
+ page_size = 1000
+ max_pages = 100
+ sample_size = 10000
- # Count total models efficiently
models_iter = self.api.list_models(full=False)
sampled_models = []
@@ -87,25 +153,18 @@ class ModelCountTracker:
if i < sample_size:
sampled_models.append(model)
- # Safety limit to prevent infinite loops
if i >= max_pages * page_size:
- # If we hit the limit, estimate total from sample
- # This is a rough estimate - for exact count, increase max_pages
break
- # Calculate breakdowns from sample (extrapolate if needed)
for model in sampled_models:
- # Count by library
if hasattr(model, 'library_name') and model.library_name:
lib = model.library_name
library_counts[lib] = library_counts.get(lib, 0) + 1
- # Count by pipeline
if hasattr(model, 'pipeline_tag') and model.pipeline_tag:
pipeline = model.pipeline_tag
pipeline_counts[pipeline] = pipeline_counts.get(pipeline, 0) + 1
- # If we sampled, scale up the breakdowns proportionally
if len(sampled_models) < total_count and len(sampled_models) > 0:
scale_factor = total_count / len(sampled_models)
library_counts = {k: int(v * scale_factor) for k, v in library_counts.items()}
@@ -118,7 +177,7 @@ class ModelCountTracker:
"timestamp": datetime.utcnow().isoformat()
}
except Exception as e:
- print(f"Error fetching model count: {e}")
+ logger.error(f"Error fetching model count: {e}", exc_info=True)
return {
"total_models": 0,
"models_by_library": {},
@@ -162,7 +221,7 @@ class ModelCountTracker:
conn.close()
return True
except Exception as e:
- print(f"Error recording count: {e}")
+ logger.error(f"Error recording count: {e}", exc_info=True)
return False
def get_historical_counts(
@@ -211,7 +270,7 @@ class ModelCountTracker:
conn.close()
return results
except Exception as e:
- print(f"Error fetching historical counts: {e}")
+ logger.error(f"Error fetching historical counts: {e}", exc_info=True)
return []
def get_latest_count(self) -> Optional[Dict]:
@@ -239,7 +298,7 @@ class ModelCountTracker:
}
return None
except Exception as e:
- print(f"Error fetching latest count: {e}")
+ logger.error(f"Error fetching latest count: {e}", exc_info=True)
return None
def get_growth_stats(self, days: int = 7) -> Dict:
diff --git a/backend/services/model_tracker_improved.py b/backend/services/model_tracker_improved.py
index 3264597131f2039cddffd74e89346e9310f09959..685504c1abf7ae2b27f336488862659cfdf19f24 100644
--- a/backend/services/model_tracker_improved.py
+++ b/backend/services/model_tracker_improved.py
@@ -11,12 +11,17 @@ Key improvements:
import os
import json
import sqlite3
+import logging
+import re
from datetime import datetime, timedelta
from typing import Dict, List, Optional, Tuple
from huggingface_hub import HfApi
import pandas as pd
from pathlib import Path
import time
+import httpx
+
+logger = logging.getLogger(__name__)
class ImprovedModelCountTracker:
@@ -78,72 +83,73 @@ class ImprovedModelCountTracker:
elapsed = (datetime.utcnow() - self._cache_timestamp).total_seconds()
return elapsed < self.cache_ttl
- def get_current_model_count(self, use_cache: bool = True, force_refresh: bool = False) -> Dict:
+ def get_current_model_count(self, use_cache: bool = True, force_refresh: bool = False, use_models_page: bool = True) -> Dict:
"""
- Fetch current model count from Hugging Face Hub API.
- Uses caching and efficient sampling strategies.
+ Fetch current model count from Hugging Face Hub.
+ Uses multiple strategies: models page scraping (fastest), API, or dataset snapshot.
Args:
use_cache: Whether to use cached results if available
force_refresh: Force refresh even if cache is valid
+ use_models_page: Try to get count from HF models page first (default: True)
Returns:
Dictionary with total count and breakdowns
"""
- # Check cache first
if use_cache and not force_refresh and self._is_cache_valid():
return self._cache
+ if use_models_page:
+ page_count = self.get_count_from_models_page()
+ if page_count:
+ dataset_count = self.get_count_from_dataset_snapshot()
+ if dataset_count and dataset_count.get("models_by_library"):
+ page_count["models_by_library"] = dataset_count.get("models_by_library", {})
+ page_count["models_by_pipeline"] = dataset_count.get("models_by_pipeline", {})
+ page_count["models_by_author"] = dataset_count.get("models_by_author", {})
+
+ self._cache = page_count
+ self._cache_timestamp = datetime.utcnow()
+ return page_count
+
try:
- # Strategy 1: Try to get count efficiently using pagination
- # The HfApi.list_models() returns an iterator, so we can count efficiently
total_count = 0
library_counts = {}
pipeline_counts = {}
author_counts = {}
- # For breakdowns, we sample a subset for efficiency
- sample_size = 20000 # Sample 20K models for breakdowns
- max_count_for_full_breakdown = 50000 # If less than this, do full breakdown
+ sample_size = 20000
+ max_count_for_full_breakdown = 50000
models_iter = self.api.list_models(full=False, sort="created", direction=-1)
sampled_models = []
start_time = time.time()
- timeout_seconds = 30 # Don't spend more than 30 seconds
+ timeout_seconds = 30
for i, model in enumerate(models_iter):
- # Check timeout
if time.time() - start_time > timeout_seconds:
- # If we hit timeout, use sampling strategy
break
total_count += 1
- # Sample models for breakdowns
if i < sample_size:
sampled_models.append(model)
- # For smaller datasets, we can do full breakdown
if total_count < max_count_for_full_breakdown:
- # Count by library
if hasattr(model, 'library_name') and model.library_name:
lib = model.library_name
library_counts[lib] = library_counts.get(lib, 0) + 1
- # Count by pipeline
if hasattr(model, 'pipeline_tag') and model.pipeline_tag:
pipeline = model.pipeline_tag
pipeline_counts[pipeline] = pipeline_counts.get(pipeline, 0) + 1
- # Count by author (extract from model_id)
if hasattr(model, 'id') and model.id:
author = model.id.split('/')[0] if '/' in model.id else 'unknown'
author_counts[author] = author_counts.get(author, 0) + 1
- # If we sampled, calculate breakdowns from sample and extrapolate
if total_count > len(sampled_models) and len(sampled_models) > 0:
- # Calculate breakdowns from sample
for model in sampled_models:
if hasattr(model, 'library_name') and model.library_name:
lib = model.library_name
@@ -157,7 +163,6 @@ class ImprovedModelCountTracker:
author = model.id.split('/')[0] if '/' in model.id else 'unknown'
author_counts[author] = author_counts.get(author, 0) + 1
- # Scale up breakdowns proportionally
if len(sampled_models) > 0:
scale_factor = total_count / len(sampled_models)
library_counts = {k: int(v * scale_factor) for k, v in library_counts.items()}
@@ -168,20 +173,19 @@ class ImprovedModelCountTracker:
"total_models": total_count,
"models_by_library": library_counts,
"models_by_pipeline": pipeline_counts,
- "models_by_author": dict(sorted(author_counts.items(), key=lambda x: x[1], reverse=True)[:20]), # Top 20 authors
+ "models_by_author": dict(sorted(author_counts.items(), key=lambda x: x[1], reverse=True)[:20]),
"timestamp": datetime.utcnow().isoformat(),
"sampling_used": total_count > len(sampled_models) if sampled_models else False,
"sample_size": len(sampled_models) if sampled_models else total_count
}
- # Update cache
self._cache = result
self._cache_timestamp = datetime.utcnow()
return result
except Exception as e:
- print(f"Error fetching model count: {e}")
+ logger.error(f"Error fetching model count: {e}", exc_info=True)
return {
"total_models": 0,
"models_by_library": {},
@@ -191,6 +195,70 @@ class ImprovedModelCountTracker:
"error": str(e)
}
+ def get_count_from_models_page(self) -> Optional[Dict]:
+ """
+ Get model count by scraping the Hugging Face models page.
+ Extracts count from the div with class "font-normal text-gray-400" on https://huggingface.co/models
+
+ Returns:
+ Dictionary with total_models count, or None if extraction fails
+ """
+ try:
+ url = "https://huggingface.co/models"
+ response = httpx.get(url, timeout=10.0, follow_redirects=True)
+ response.raise_for_status()
+
+ html_content = response.text
+
+            # Look for a pattern like: <div class="font-normal text-gray-400">2,249,310</div>
+            # The number is rendered with thousands separators (commas)
+            pattern = r'<div[^>]*class="[^"]*font-normal[^"]*text-gray-400[^"]*"[^>]*>([\d,]+)</div>'
+ matches = re.findall(pattern, html_content)
+
+ if matches:
+ # Take the first match and remove commas
+ count_str = matches[0].replace(',', '')
+ total_models = int(count_str)
+
+ logger.info(f"Extracted model count from HF models page: {total_models}")
+
+ return {
+ "total_models": total_models,
+ "timestamp": datetime.utcnow().isoformat(),
+ "source": "hf_models_page",
+ "models_by_library": {},
+ "models_by_pipeline": {},
+ "models_by_author": {}
+ }
+ else:
+ # Fallback: try to find the number in the window.__hf_deferred object
+ # The page has: window.__hf_deferred["numTotalItems"] = 2249312;
+ deferred_pattern = r'window\.__hf_deferred\["numTotalItems"\]\s*=\s*(\d+);'
+ deferred_matches = re.findall(deferred_pattern, html_content)
+
+ if deferred_matches:
+ total_models = int(deferred_matches[0])
+ logger.info(f"Extracted model count from window.__hf_deferred: {total_models}")
+
+ return {
+ "total_models": total_models,
+ "timestamp": datetime.utcnow().isoformat(),
+ "source": "hf_models_page_deferred",
+ "models_by_library": {},
+ "models_by_pipeline": {},
+ "models_by_author": {}
+ }
+
+ logger.warning("Could not find model count in HF models page HTML")
+ return None
+
+ except httpx.HTTPError as e:
+ logger.error(f"HTTP error fetching HF models page: {e}", exc_info=True)
+ return None
+ except Exception as e:
+ logger.error(f"Error extracting count from HF models page: {e}", exc_info=True)
+ return None
+
def get_count_from_dataset_snapshot(self, dataset_name: str = "modelbiome/ai_ecosystem_withmodelcards") -> Optional[Dict]:
"""
Alternative method: Get count from dataset snapshot (like ai-ecosystem repo does).
@@ -205,11 +273,9 @@ class ImprovedModelCountTracker:
try:
from datasets import load_dataset
- # Load just metadata to get count quickly
dataset = load_dataset(dataset_name, split="train")
total_count = len(dataset)
- # Sample for breakdowns
sample_size = min(10000, total_count)
sample = dataset.shuffle(seed=42).select(range(sample_size))
@@ -225,7 +291,6 @@ class ImprovedModelCountTracker:
pipeline = item['pipeline_tag']
pipeline_counts[pipeline] = pipeline_counts.get(pipeline, 0) + 1
- # Scale up
if sample_size < total_count:
scale_factor = total_count / sample_size
library_counts = {k: int(v * scale_factor) for k, v in library_counts.items()}
@@ -239,7 +304,7 @@ class ImprovedModelCountTracker:
"source": "dataset_snapshot"
}
except Exception as e:
- print(f"Error loading from dataset snapshot: {e}")
+ logger.error(f"Error loading from dataset snapshot: {e}", exc_info=True)
return None
def record_count(self, count_data: Optional[Dict] = None, source: str = "api") -> bool:
@@ -279,7 +344,7 @@ class ImprovedModelCountTracker:
conn.close()
return True
except Exception as e:
- print(f"Error recording count: {e}")
+ logger.error(f"Error recording count: {e}", exc_info=True)
return False
def get_historical_counts(
@@ -329,7 +394,7 @@ class ImprovedModelCountTracker:
conn.close()
return results
except Exception as e:
- print(f"Error fetching historical counts: {e}")
+ logger.error(f"Error fetching historical counts: {e}", exc_info=True)
return []
def get_latest_count(self) -> Optional[Dict]:
@@ -358,7 +423,7 @@ class ImprovedModelCountTracker:
}
return None
except Exception as e:
- print(f"Error fetching latest count: {e}")
+ logger.error(f"Error fetching latest count: {e}", exc_info=True)
return None
def get_growth_stats(self, days: int = 7) -> Dict:
diff --git a/backend/utils/data_loader.py b/backend/utils/data_loader.py
index 72e0a3f0a2258b8959d977e026bd457a8b54458f..f454029940b9fd7ad273022a14034bad88a50e7f 100644
--- a/backend/utils/data_loader.py
+++ b/backend/utils/data_loader.py
@@ -50,18 +50,16 @@ class ModelDataLoader:
else:
df = df.copy()
- # Fill NaN values
text_fields = ['tags', 'pipeline_tag', 'library_name', 'modelCard']
for field in text_fields:
if field in df.columns:
df[field] = df[field].fillna('')
- # Combine text fields for embedding
df['combined_text'] = (
df.get('tags', '').astype(str) + ' ' +
df.get('pipeline_tag', '').astype(str) + ' ' +
df.get('library_name', '').astype(str) + ' ' +
- df['modelCard'].astype(str).str[:500] # Limit modelCard to first 500 chars
+ df['modelCard'].astype(str).str[:500]
)
return df
@@ -94,7 +92,6 @@ class ModelDataLoader:
else:
df = df.copy()
- # Optimized filtering with vectorized operations
if min_downloads is not None:
downloads_col = df.get('downloads', pd.Series([0] * len(df), index=df.index))
df = df[downloads_col >= min_downloads]
diff --git a/backend/utils/embeddings.py b/backend/utils/embeddings.py
index 61a30e0b737cbfe5957c4c67cc9680c4ad65b623..4e38f7d16e03cace63fa05796eeca55ef1670ef6 100644
--- a/backend/utils/embeddings.py
+++ b/backend/utils/embeddings.py
@@ -27,7 +27,7 @@ class ModelEmbedder:
def generate_embeddings(
self,
texts: List[str],
- batch_size: int = 128, # Increased default batch size for speed
+ batch_size: int = 128,
show_progress: bool = True
) -> np.ndarray:
"""
diff --git a/backend/utils/family_tree.py b/backend/utils/family_tree.py
new file mode 100644
index 0000000000000000000000000000000000000000..e43fc92a996b7f4e945862ec65540e9d7db52697
--- /dev/null
+++ b/backend/utils/family_tree.py
@@ -0,0 +1,66 @@
+"""Family tree utility functions."""
+import pandas as pd
+from typing import Dict
+
+def calculate_family_depths(df: pd.DataFrame) -> Dict[str, int]:
+ """Calculate family depth for each model."""
+ depths = {}
+ computing = set()
+
+ def get_depth(model_id: str) -> int:
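+        # Depth = parent's depth + 1; the `computing` set marks models currently being
+        # resolved so that a parent cycle is treated as depth 0 instead of recursing forever.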
+ if model_id in depths:
+ return depths[model_id]
+ if model_id in computing:
+ depths[model_id] = 0
+ return 0
+
+ computing.add(model_id)
+
+ try:
+ if df.index.name == 'model_id':
+ row = df.loc[model_id]
+ else:
+ rows = df[df.get('model_id', '') == model_id]
+ if len(rows) == 0:
+ depths[model_id] = 0
+ computing.remove(model_id)
+ return 0
+ row = rows.iloc[0]
+
+ parent_id = row.get('parent_model')
+ if parent_id and pd.notna(parent_id):
+ parent_str = str(parent_id)
+ if parent_str != 'nan' and parent_str != '':
+ if df.index.name == 'model_id' and parent_str in df.index:
+ depth = get_depth(parent_str) + 1
+ elif df.index.name != 'model_id':
+ parent_rows = df[df.get('model_id', '') == parent_str]
+ if len(parent_rows) > 0:
+ depth = get_depth(parent_str) + 1
+ else:
+ depth = 0
+ else:
+ depth = 0
+ else:
+ depth = 0
+ else:
+ depth = 0
+ except (KeyError, IndexError):
+ depth = 0
+
+ depths[model_id] = depth
+ computing.remove(model_id)
+ return depth
+
+ if df.index.name == 'model_id':
+ for model_id in df.index:
+ if model_id not in depths:
+ get_depth(str(model_id))
+ else:
+ for _, row in df.iterrows():
+ model_id = str(row.get('model_id', ''))
+ if model_id and model_id not in depths:
+ get_depth(model_id)
+
+ return depths
+
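
A quick usage sketch for `calculate_family_depths` on a toy two-level lineage (the data is invented for illustration and assumes the backend package is on the import path):

```python
import pandas as pd
from utils.family_tree import calculate_family_depths

# Toy lineage: base model -> fine-tune -> quantised re-upload.
df = pd.DataFrame({
    "model_id": ["org/base", "org/base-ft", "org/base-ft-q4"],
    "parent_model": [None, "org/base", "org/base-ft"],
})

depths = calculate_family_depths(df)
print(depths)  # {'org/base': 0, 'org/base-ft': 1, 'org/base-ft-q4': 2}
```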
diff --git a/backend/utils/graph_embeddings.py b/backend/utils/graph_embeddings.py
new file mode 100644
index 0000000000000000000000000000000000000000..e14e6fc9480b2b970eaa2130ed48f1ecd76ffee5
--- /dev/null
+++ b/backend/utils/graph_embeddings.py
@@ -0,0 +1,177 @@
+"""
+Graph-aware embeddings for hierarchical model relationships.
+Uses Node2Vec to create embeddings that respect family tree structure.
+"""
+import numpy as np
+import pandas as pd
+from typing import Dict, List, Optional, Tuple
+import networkx as nx
+import pickle
+import os
+import logging
+
+logger = logging.getLogger(__name__)
+
+try:
+ from node2vec import Node2Vec
+ NODE2VEC_AVAILABLE = True
+except ImportError:
+ NODE2VEC_AVAILABLE = False
+ logger.warning("node2vec not available. Install with: pip install node2vec")
+
+
+class GraphEmbedder:
+ """
+ Generate graph embeddings that respect hierarchical relationships.
+ Combines text embeddings with graph structure embeddings.
+ """
+
+ def __init__(self, dimensions: int = 128, walk_length: int = 30, num_walks: int = 200):
+ """
+ Initialize graph embedder.
+
+ Args:
+ dimensions: Embedding dimensions
+ walk_length: Length of random walks
+ num_walks: Number of walks per node
+ """
+ self.dimensions = dimensions
+ self.walk_length = walk_length
+ self.num_walks = num_walks
+ self.graph: Optional[nx.DiGraph] = None
+ self.embeddings: Optional[np.ndarray] = None
+ self.model = None  # fitted gensim Word2Vec returned by node2vec.fit(); untyped so the name Node2Vec is never referenced when the import failed
+
+ def build_family_graph(self, df: pd.DataFrame) -> nx.DiGraph:
+ """
+ Build directed graph from family relationships.
+
+ Args:
+ df: DataFrame with model_id and parent_model columns
+
+ Returns:
+ NetworkX DiGraph
+ """
+ graph = nx.DiGraph()
+
+ for idx, row in df.iterrows():
+ model_id = str(row.get('model_id', idx))
+ graph.add_node(model_id)
+
+ parent_id = row.get('parent_model')
+ if parent_id and pd.notna(parent_id):
+ parent_str = str(parent_id)
+ if parent_str != 'nan' and parent_str != '':
+ graph.add_edge(parent_str, model_id)
+
+ self.graph = graph
+ logger.info(f"Built graph with {graph.number_of_nodes()} nodes and {graph.number_of_edges()} edges")
+ return graph
+
+ def generate_graph_embeddings(
+ self,
+ graph: Optional[nx.DiGraph] = None,
+ workers: int = 4
+ ) -> Dict[str, np.ndarray]:
+ """
+ Generate Node2Vec embeddings for graph nodes.
+
+ Args:
+ graph: NetworkX graph (uses self.graph if None)
+ workers: Number of parallel workers
+
+ Returns:
+ Dictionary mapping model_id to embedding vector
+ """
+ if not NODE2VEC_AVAILABLE:
+ logger.warning("Node2Vec not available, returning empty embeddings")
+ return {}
+
+ if graph is None:
+ graph = self.graph
+
+ if graph is None or graph.number_of_nodes() == 0:
+ logger.warning("No graph available for embedding generation")
+ return {}
+
+ try:
+ node2vec = Node2Vec(
+ graph,
+ dimensions=self.dimensions,
+ walk_length=self.walk_length,
+ num_walks=self.num_walks,
+ workers=workers
+ )
+
+ model = node2vec.fit(window=10, min_count=1, batch_words=4)
+ self.model = model
+
+ embeddings_dict = {}
+ for node in graph.nodes():
+ if node in model.wv:
+ embeddings_dict[node] = model.wv[node]
+
+ logger.info(f"Generated graph embeddings for {len(embeddings_dict)} nodes")
+ return embeddings_dict
+
+ except Exception as e:
+ logger.error(f"Error generating graph embeddings: {e}", exc_info=True)
+ return {}
+
+ def combine_embeddings(
+ self,
+ text_embeddings: np.ndarray,
+ graph_embeddings: Dict[str, np.ndarray],
+ model_ids: List[str],
+ text_weight: float = 0.7,
+ graph_weight: float = 0.3
+ ) -> np.ndarray:
+ """
+ Combine text and graph embeddings by concatenating the L2-normalized vectors, each scaled by its weight.
+
+ Args:
+ text_embeddings: Text-based embeddings (n_samples, text_dim)
+ graph_embeddings: Graph embeddings dictionary
+ model_ids: List of model IDs corresponding to text_embeddings
+ text_weight: Weight for text embeddings
+ graph_weight: Weight for graph embeddings
+
+ Returns:
+ Combined embeddings (n_samples, text_dim + graph_dim), or text_embeddings unchanged if no graph embeddings are available
+ """
+ if not graph_embeddings:
+ return text_embeddings
+
+ text_dim = text_embeddings.shape[1]
+ graph_dim = next(iter(graph_embeddings.values())).shape[0]
+
+ combined = np.zeros((len(model_ids), text_dim + graph_dim))
+
+ for i, model_id in enumerate(model_ids):
+ model_id_str = str(model_id)
+
+ text_emb = text_embeddings[i]
+ graph_emb = graph_embeddings.get(model_id_str, np.zeros(graph_dim))
+
+ normalized_text = text_emb / (np.linalg.norm(text_emb) + 1e-8)
+ normalized_graph = graph_emb / (np.linalg.norm(graph_emb) + 1e-8)
+
+ combined[i] = np.concatenate([
+ normalized_text * text_weight,
+ normalized_graph * graph_weight
+ ])
+
+ return combined
+
+ def save_embeddings(self, embeddings: Dict[str, np.ndarray], filepath: str):
+ """Save graph embeddings to disk."""
+ os.makedirs(os.path.dirname(filepath) or '.', exist_ok=True)
+ with open(filepath, 'wb') as f:
+ pickle.dump(embeddings, f)
+
+ def load_embeddings(self, filepath: str) -> Dict[str, np.ndarray]:
+ """Load graph embeddings from disk."""
+ with open(filepath, 'rb') as f:
+ return pickle.load(f)
+
+
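
An end-to-end sketch of how `GraphEmbedder` is meant to be driven — build the family graph, run Node2Vec over it, then fuse the result with text embeddings. The DataFrame and the random 384-dimensional "text embeddings" are stand-ins; `node2vec` must be installed for the graph step, otherwise the combiner simply returns the text embeddings unchanged:

```python
import numpy as np
import pandas as pd
from utils.graph_embeddings import GraphEmbedder

df = pd.DataFrame({
    "model_id": ["org/base", "org/base-ft", "org/base-ft-q4"],
    "parent_model": [None, "org/base", "org/base-ft"],
})

embedder = GraphEmbedder(dimensions=16, walk_length=10, num_walks=20)
graph = embedder.build_family_graph(df)

# Empty dict if node2vec is not installed; combine_embeddings then falls back to text only.
graph_embs = embedder.generate_graph_embeddings(graph, workers=1)

# Stand-in for sentence-transformer output: one 384-dim vector per model.
text_embs = np.random.rand(len(df), 384).astype(np.float32)

combined = embedder.combine_embeddings(
    text_embs, graph_embs, df["model_id"].tolist(),
    text_weight=0.7, graph_weight=0.3,
)
print(combined.shape)  # (3, 400) with graph embeddings; (3, 384) without
```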
diff --git a/backend/utils/network_analysis.py b/backend/utils/network_analysis.py
index a82801bc183cedeabd995fc870507be4d3c9b44c..7f4983ed201ce1a784b1924c8a141f88822636d6 100644
--- a/backend/utils/network_analysis.py
+++ b/backend/utils/network_analysis.py
@@ -1,6 +1,7 @@
"""
Network analysis module inspired by Open Syllabus Project.
Builds co-occurrence networks for models based on shared contexts.
+Supports multiple relationship types: finetune, quantized, adapter, merge.
"""
import pandas as pd
import numpy as np
@@ -8,12 +9,66 @@ from collections import Counter
from itertools import combinations
from typing import List, Dict, Tuple, Optional, Set
import networkx as nx
+import ast
+from datetime import datetime
+
+
+def _parse_parent_list(value) -> List[str]:
+ """
+ Parse parent model list from string/eval format.
+ Handles both string representations and actual lists.
+ """
+ if isinstance(value, (list, tuple, np.ndarray)):
+ return [str(p) for p in value if p and str(p) != 'nan']
+ if pd.isna(value) or value == '' or str(value) == 'nan':
+ return []
+
+ try:
+ if isinstance(value, str):
+ if value.startswith('[') or value.startswith('('):
+ parsed = ast.literal_eval(value)
+ else:
+ parsed = [value]
+ else:
+ parsed = value
+
+ if isinstance(parsed, list):
+ return [str(p) for p in parsed if p and str(p) != 'nan']
+ elif parsed:
+ return [str(parsed)]
+ else:
+ return []
+ except (ValueError, SyntaxError):
+ return []
+
+
+def _get_all_parents(row: pd.Series) -> Dict[str, List[str]]:
+ """
+ Extract all parent types from a row.
+ Returns dict mapping relationship type to list of parent IDs.
+ """
+ parents = {}
+
+ parent_columns = {
+ 'parent_model': 'parent',
+ 'finetune_parent': 'finetune',
+ 'quantized_parent': 'quantized',
+ 'adapter_parent': 'adapter',
+ 'merge_parent': 'merge'
+ }
+
+ for col, rel_type in parent_columns.items():
+ if col in row:
+ parent_list = _parse_parent_list(row.get(col))
+ if parent_list:
+ parents[rel_type] = parent_list
+
+ return parents
class ModelNetworkBuilder:
"""
Build network graphs for models based on co-occurrence patterns.
Similar to Open Syllabus approach of connecting texts that appear together.
+ Supports multiple relationship types: finetune, quantized, adapter, merge.
"""
def __init__(self, df: pd.DataFrame):
@@ -22,13 +77,13 @@ class ModelNetworkBuilder:
Args:
df: DataFrame with model data including model_id, library_name,
- pipeline_tag, tags, parent_model, downloads, likes
+ pipeline_tag, tags, parent_model, finetune_parent, quantized_parent,
+ adapter_parent, merge_parent, downloads, likes, createdAt
"""
self.df = df.copy()
if 'model_id' not in self.df.columns:
raise ValueError("DataFrame must contain 'model_id' column")
- # Ensure model_id is index for fast lookups
if self.df.index.name != 'model_id':
if 'model_id' in self.df.columns:
self.df.set_index('model_id', drop=False, inplace=True)
@@ -208,23 +263,41 @@ class ModelNetworkBuilder:
def build_family_tree_network(
self,
root_model_id: str,
- max_depth: int = 5
+ max_depth: Optional[int] = 5,
+ include_edge_attributes: bool = True,
+ filter_edge_types: Optional[List[str]] = None
) -> nx.DiGraph:
"""
- Build directed graph of model family tree.
+ Build directed graph of model family tree with multiple relationship types.
Args:
root_model_id: Root model to start from
- max_depth: Maximum depth to traverse
+ max_depth: Maximum depth to traverse. If None, traverses entire tree without limit.
+ include_edge_attributes: Whether to calculate edge attributes (change in likes, downloads, etc.)
+ filter_edge_types: List of edge types to include (e.g., ['finetune', 'quantized']).
+ If None, includes all types.
Returns:
- NetworkX DiGraph representing family tree
+ NetworkX DiGraph representing family tree with edge types and attributes
"""
graph = nx.DiGraph()
visited = set()
- def add_family(current_id: str, depth: int):
- if depth <= 0 or current_id in visited:
+ children_index: Dict[str, List[Tuple[str, str]]] = {}
+ for idx, row in self.df.iterrows():
+ model_id = str(row.get('model_id', idx))
+ all_parents = _get_all_parents(row)
+
+ for rel_type, parent_list in all_parents.items():
+ for parent_id in parent_list:
+ if parent_id not in children_index:
+ children_index[parent_id] = []
+ children_index[parent_id].append((model_id, rel_type))
+
+ def add_family(current_id: str, depth: Optional[int]):
+ if current_id in visited:
+ return
+ if depth is not None and depth <= 0:
return
visited.add(current_id)
@@ -233,28 +306,98 @@ class ModelNetworkBuilder:
row = self.df.loc[current_id]
- # Add node
graph.add_node(str(current_id))
graph.nodes[str(current_id)]['title'] = self._format_title(current_id)
graph.nodes[str(current_id)]['freq'] = int(row.get('downloads', 0))
+ graph.nodes[str(current_id)]['likes'] = int(row.get('likes', 0))
+ graph.nodes[str(current_id)]['downloads'] = int(row.get('downloads', 0))
+ graph.nodes[str(current_id)]['library'] = str(row.get('library_name', '')) if pd.notna(row.get('library_name')) else ''
+ graph.nodes[str(current_id)]['pipeline'] = str(row.get('pipeline_tag', '')) if pd.notna(row.get('pipeline_tag')) else ''
- # Add edge to parent
- parent_id = row.get('parent_model')
- if parent_id and pd.notna(parent_id) and str(parent_id) != 'nan':
- parent_id_str = str(parent_id)
- graph.add_edge(parent_id_str, str(current_id))
- add_family(parent_id_str, depth - 1)
+ createdAt = row.get('createdAt')
+ if pd.notna(createdAt):
+ graph.nodes[str(current_id)]['createdAt'] = str(createdAt)
- # Add edges to children
- children = self.df[self.df.get('parent_model', '') == current_id]
- for child_id, child_row in children.iterrows():
+ all_parents = _get_all_parents(row)
+ for rel_type, parent_list in all_parents.items():
+ if filter_edge_types and rel_type not in filter_edge_types:
+ continue
+
+ for parent_id in parent_list:
+ if parent_id in self.df.index:
+ if not graph.has_edge(parent_id, str(current_id)):
+ graph.add_edge(parent_id, str(current_id))
+ graph[parent_id][str(current_id)]['edge_types'] = [rel_type]
+ graph[parent_id][str(current_id)]['edge_type'] = rel_type
+ elif rel_type not in graph[parent_id][str(current_id)].get('edge_types', []):
+ graph[parent_id][str(current_id)]['edge_types'].append(rel_type)
+
+ next_depth = depth - 1 if depth is not None else None
+ add_family(parent_id, next_depth)
+
+ children = children_index.get(current_id, [])
+ for child_id, rel_type in children:
+ if filter_edge_types and rel_type not in filter_edge_types:
+ continue
+
if str(child_id) not in visited:
- graph.add_edge(str(current_id), str(child_id))
- add_family(str(child_id), depth - 1)
+ if not graph.has_edge(str(current_id), child_id):
+ graph.add_edge(str(current_id), child_id)
+ graph[str(current_id)][child_id]['edge_types'] = [rel_type]
+ graph[str(current_id)][child_id]['edge_type'] = rel_type
+ else:
+ if rel_type not in graph[str(current_id)][child_id].get('edge_types', []):
+ graph[str(current_id)][child_id]['edge_types'].append(rel_type)
+
+ next_depth = depth - 1 if depth is not None else None
+ add_family(child_id, next_depth)
add_family(root_model_id, max_depth)
+
+ if include_edge_attributes:
+ self._add_edge_attributes(graph)
+
return graph
+ def _add_edge_attributes(self, graph: nx.DiGraph):
+ """
+ Add edge attributes like change in likes, downloads, time difference.
+ Similar to the notebook's edge attribute calculation.
+ """
+ for edge in graph.edges():
+ parent_model = edge[0]
+ model_id = edge[1]
+
+ if parent_model not in graph.nodes() or model_id not in graph.nodes():
+ continue
+
+ parent_likes = graph.nodes[parent_model].get('likes', 0)
+ model_likes = graph.nodes[model_id].get('likes', 0)
+ parent_downloads = graph.nodes[parent_model].get('downloads', 0)
+ model_downloads = graph.nodes[model_id].get('downloads', 0)
+
+ graph.edges[edge]['change_in_likes'] = model_likes - parent_likes
+ if parent_likes != 0:
+ graph.edges[edge]['percentage_change_in_likes'] = (model_likes - parent_likes) / parent_likes
+ else:
+ graph.edges[edge]['percentage_change_in_likes'] = np.nan
+
+ graph.edges[edge]['change_in_downloads'] = model_downloads - parent_downloads
+ if parent_downloads != 0:
+ graph.edges[edge]['percentage_change_in_downloads'] = (model_downloads - parent_downloads) / parent_downloads
+ else:
+ graph.edges[edge]['percentage_change_in_downloads'] = np.nan
+
+ parent_created = graph.nodes[parent_model].get('createdAt')
+ model_created = graph.nodes[model_id].get('createdAt')
+
+ if parent_created and model_created:
+ try:
+ parent_dt = datetime.strptime(str(parent_created), '%Y-%m-%dT%H:%M:%S.%fZ')
+ model_dt = datetime.strptime(str(model_created), '%Y-%m-%dT%H:%M:%S.%fZ')
+ graph.edges[edge]['change_in_createdAt_days'] = (model_dt - parent_dt).days
+ except (ValueError, TypeError):
+ graph.edges[edge]['change_in_createdAt_days'] = np.nan
+ else:
+ graph.edges[edge]['change_in_createdAt_days'] = np.nan
+
def export_graphml(self, graph: nx.Graph, filename: str):
"""Export graph to GraphML format (like Open Syllabus)."""
nx.write_graphml(graph, filename)
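
A usage sketch for the reworked `build_family_tree_network`: unlimited depth, edges restricted to the fine-tune and quantized relationship types, and the computed edge attributes read back off the graph. The DataFrame below is a toy stand-in for the real model dump:

```python
import pandas as pd
from utils.network_analysis import ModelNetworkBuilder

df = pd.DataFrame({
    "model_id": ["org/base", "org/base-ft", "org/base-ft-q4"],
    "parent_model": [None, "org/base", "org/base-ft"],
    "finetune_parent": [None, "['org/base']", None],
    "quantized_parent": [None, None, "['org/base-ft']"],
    "downloads": [100_000, 25_000, 5_000],
    "likes": [500, 120, 30],
    "createdAt": ["2023-01-01T00:00:00.000Z",
                  "2023-03-01T00:00:00.000Z",
                  "2023-04-15T00:00:00.000Z"],
})

builder = ModelNetworkBuilder(df)
tree = builder.build_family_tree_network(
    "org/base",
    max_depth=None,                          # walk the whole tree
    include_edge_attributes=True,
    filter_edge_types=["finetune", "quantized"],
)

for parent, child, attrs in tree.edges(data=True):
    print(parent, "->", child, attrs["edge_types"], attrs["change_in_likes"])
```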
diff --git a/frontend/.npmrc b/frontend/.npmrc
index 8c1d73ae125936d71261229d76e34cba870dc990..7356968121dade60fef934ab95fda9fd10761283 100644
--- a/frontend/.npmrc
+++ b/frontend/.npmrc
@@ -1,2 +1,4 @@
legacy-peer-deps=true
+
+
diff --git a/frontend/package-lock.json b/frontend/package-lock.json
index 2140e6ab206bff4c53ebf3d29a263db0473beb05..74fbbb1ee5dfd4b61fe42f2cd46ed6ab481b3270 100644
--- a/frontend/package-lock.json
+++ b/frontend/package-lock.json
@@ -32,7 +32,8 @@
"react-dom": "^18.2.0",
"react-scripts": "5.0.1",
"three": "^0.160.1",
- "typescript": "^5.0.0"
+ "typescript": "^5.0.0",
+ "zustand": "^5.0.8"
}
},
"node_modules/@alloc/quick-lru": {
diff --git a/frontend/package.json b/frontend/package.json
index 6c5dd299ae4098925421aa759357f3c29aa07fdc..df73512b094c59e8854eded3c1053fd2a4750ba0 100644
--- a/frontend/package.json
+++ b/frontend/package.json
@@ -28,7 +28,8 @@
"react-dom": "^18.2.0",
"react-scripts": "5.0.1",
"three": "^0.160.1",
- "typescript": "^5.0.0"
+ "typescript": "^5.0.0",
+ "zustand": "^5.0.8"
},
"scripts": {
"start": "react-scripts start",
diff --git a/frontend/public/index.html b/frontend/public/index.html
index 0a04459565a0ba5a79038d5b8ae8aec4f41feb2a..023b865876569432bbc201528bd683184f41b8b3 100644
--- a/frontend/public/index.html
+++ b/frontend/public/index.html
@@ -10,7 +10,7 @@
/>
-
+
Anatomy of a Machine Learning Ecosystem: 2 Million Models on Hugging Face
diff --git a/frontend/src/App.css b/frontend/src/App.css
index a8317e31f12ae417be65760b5d5b95387dde1e0b..76b15732029dc3fd1a9ef6975b18794b5cf287b1 100644
--- a/frontend/src/App.css
+++ b/frontend/src/App.css
@@ -7,86 +7,24 @@
}
.App-header {
- background: linear-gradient(135deg, #1a237e 0%, #283593 20%, #3949ab 40%, #5e35b1 60%, #7b1fa2 80%, #6a1b9a 100%);
- background-size: 200% 200%;
- animation: gradientShift 20s ease infinite;
+ background: #2d2d2d;
color: #ffffff;
- padding: 3rem 2.5rem;
+ padding: 2.5rem 2rem;
text-align: center;
- border-bottom: 2px solid rgba(100, 181, 246, 0.3);
- box-shadow: 0 4px 20px rgba(0, 0, 0, 0.25), 0 2px 10px rgba(123, 31, 162, 0.3);
+ border-bottom: 1px solid #404040;
+ box-shadow: 0 2px 8px rgba(0, 0, 0, 0.15);
position: relative;
- overflow: hidden;
}
-.App-header::before {
- content: '';
- position: absolute;
- top: 0;
- left: 0;
- right: 0;
- bottom: 0;
- background:
- radial-gradient(circle at 20% 50%, rgba(100, 181, 246, 0.15) 0%, transparent 50%),
- radial-gradient(circle at 80% 80%, rgba(156, 39, 176, 0.1) 0%, transparent 50%),
- radial-gradient(circle at 40% 20%, rgba(33, 150, 243, 0.1) 0%, transparent 50%);
- pointer-events: none;
- animation: pulse 8s ease-in-out infinite;
-}
-
-.App-header::after {
- content: '';
- position: absolute;
- top: 0;
- left: 0;
- right: 0;
- bottom: 0;
- background-image:
- repeating-linear-gradient(
- 0deg,
- transparent,
- transparent 2px,
- rgba(255, 255, 255, 0.03) 2px,
- rgba(255, 255, 255, 0.03) 4px
- );
- pointer-events: none;
- opacity: 0.5;
-}
-
-@keyframes gradientShift {
- 0% {
- background-position: 0% 50%;
- }
- 50% {
- background-position: 100% 50%;
- }
- 100% {
- background-position: 0% 50%;
- }
-}
-
-@keyframes pulse {
- 0%, 100% {
- opacity: 1;
- }
- 50% {
- opacity: 0.8;
- }
-}
.App-header h1 {
margin: 0 0 1rem 0;
- font-size: 2.25rem;
- font-weight: 700;
- letter-spacing: -0.02em;
- line-height: 1.2;
- position: relative;
- z-index: 1;
- text-shadow: 0 2px 8px rgba(0, 0, 0, 0.4), 0 4px 16px rgba(123, 31, 162, 0.3);
- background: linear-gradient(180deg, #ffffff 0%, #e1bee7 100%);
- -webkit-background-clip: text;
- -webkit-text-fill-color: transparent;
- background-clip: text;
+ font-size: 2rem;
+ font-weight: 600;
+ letter-spacing: -0.01em;
+ line-height: 1.3;
+ color: #ffffff;
+ text-shadow: 0 1px 3px rgba(0, 0, 0, 0.3);
}
.App-header p {
@@ -122,23 +60,17 @@
}
.stats span {
- padding: 0.75rem 1.5rem;
- background: rgba(255, 255, 255, 0.15);
- border-radius: 12px;
- backdrop-filter: blur(20px);
- -webkit-backdrop-filter: blur(20px);
- border: 2px solid rgba(255, 255, 255, 0.25);
- transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1);
- box-shadow: 0 4px 12px rgba(0, 0, 0, 0.1), inset 0 1px 0 rgba(255, 255, 255, 0.3);
- font-weight: 600;
- letter-spacing: 0.02em;
+ padding: 0.625rem 1.25rem;
+ background: rgba(255, 255, 255, 0.1);
+ border-radius: 6px;
+ border: 1px solid rgba(255, 255, 255, 0.2);
+ transition: all 0.2s ease;
+ font-weight: 500;
}
.stats span:hover {
- background: rgba(255, 255, 255, 0.25);
- transform: translateY(-2px) scale(1.05);
- box-shadow: 0 6px 20px rgba(0, 0, 0, 0.15), inset 0 1px 0 rgba(255, 255, 255, 0.4);
- border-color: rgba(255, 255, 255, 0.4);
+ background: rgba(255, 255, 255, 0.15);
+ transform: translateY(-1px);
}
.main-content {
@@ -149,10 +81,9 @@
.sidebar {
width: 340px;
padding: 1.5rem;
- background: linear-gradient(to bottom, #fafafa 0%, #ffffff 100%);
+ background: #fafafa;
overflow-y: auto;
- border-right: 2px solid #e0e0e0;
- box-shadow: 2px 0 8px rgba(0, 0, 0, 0.05);
+ border-right: 1px solid #e0e0e0;
}
.sidebar h2 {
@@ -164,12 +95,11 @@
}
.sidebar h3 {
- font-size: 0.95rem;
- font-weight: 700;
- color: #5e35b1;
- margin: 0 0 1rem 0;
+ font-size: 0.9rem;
+ font-weight: 600;
+ color: #2d2d2d;
+ margin: 0 0 0.875rem 0;
letter-spacing: -0.01em;
- text-transform: none;
}
.sidebar label {
@@ -202,9 +132,8 @@
.sidebar input[type="text"]:focus,
.sidebar select:focus {
outline: none;
- border-color: #5e35b1;
- box-shadow: 0 0 0 3px rgba(94, 53, 177, 0.12), 0 2px 6px rgba(0, 0, 0, 0.1);
- transform: translateY(-1px);
+ border-color: #4a4a4a;
+ box-shadow: 0 0 0 2px rgba(0, 0, 0, 0.08);
}
.sidebar input[type="range"] {
@@ -227,20 +156,20 @@
.sidebar input[type="range"]::-webkit-slider-thumb {
-webkit-appearance: none;
appearance: none;
- width: 20px;
- height: 20px;
+ width: 18px;
+ height: 18px;
border-radius: 50%;
- background: linear-gradient(135deg, #5e35b1 0%, #7b1fa2 100%);
+ background: #4a4a4a;
cursor: pointer;
- box-shadow: 0 2px 6px rgba(94, 53, 177, 0.3), 0 4px 12px rgba(94, 53, 177, 0.2);
- transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1);
- border: 3px solid #ffffff;
+ box-shadow: 0 2px 4px rgba(0, 0, 0, 0.2);
+ transition: all 0.2s ease;
+ border: 2px solid #ffffff;
}
.sidebar input[type="range"]::-webkit-slider-thumb:hover {
- background: linear-gradient(135deg, #512da8 0%, #6a1b9a 100%);
- transform: scale(1.2);
- box-shadow: 0 3px 8px rgba(94, 53, 177, 0.4), 0 6px 16px rgba(94, 53, 177, 0.3);
+ background: #2d2d2d;
+ transform: scale(1.1);
+ box-shadow: 0 2px 6px rgba(0, 0, 0, 0.3);
}
.sidebar input[type="range"]::-webkit-slider-thumb:active {
@@ -248,20 +177,20 @@
}
.sidebar input[type="range"]::-moz-range-thumb {
- width: 20px;
- height: 20px;
+ width: 18px;
+ height: 18px;
border-radius: 50%;
- background: linear-gradient(135deg, #5e35b1 0%, #7b1fa2 100%);
+ background: #4a4a4a;
cursor: pointer;
- border: 3px solid #ffffff;
- box-shadow: 0 2px 6px rgba(94, 53, 177, 0.3), 0 4px 12px rgba(94, 53, 177, 0.2);
- transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1);
+ border: 2px solid #ffffff;
+ box-shadow: 0 2px 4px rgba(0, 0, 0, 0.2);
+ transition: all 0.2s ease;
}
.sidebar input[type="range"]::-moz-range-thumb:hover {
- background: linear-gradient(135deg, #512da8 0%, #6a1b9a 100%);
- transform: scale(1.2);
- box-shadow: 0 3px 8px rgba(94, 53, 177, 0.4), 0 6px 16px rgba(94, 53, 177, 0.3);
+ background: #2d2d2d;
+ transform: scale(1.1);
+ box-shadow: 0 2px 6px rgba(0, 0, 0, 0.3);
}
.sidebar input[type="range"]::-moz-range-thumb:active {
@@ -288,17 +217,16 @@
.sidebar-section {
background: #ffffff;
- border-radius: 8px;
+ border-radius: 6px;
padding: 1.25rem;
- margin-bottom: 1.25rem;
+ margin-bottom: 1rem;
border: 1px solid #e0e0e0;
- box-shadow: 0 1px 3px rgba(0, 0, 0, 0.08);
- transition: all 0.3s ease;
+ transition: all 0.2s ease;
}
.sidebar-section:hover {
- box-shadow: 0 2px 8px rgba(0, 0, 0, 0.12);
border-color: #d0d0d0;
+ box-shadow: 0 1px 3px rgba(0, 0, 0, 0.05);
}
.filter-chip {
@@ -380,22 +308,21 @@
}
.loading {
- color: #5e35b1;
+ color: #2d2d2d;
font-weight: 600;
- background: linear-gradient(135deg, #f5f3ff 0%, #ede7f6 100%);
- border: 2px solid #d1c4e9;
- box-shadow: 0 4px 12px rgba(94, 53, 177, 0.1);
+ background: #f5f5f5;
+ border: 1px solid #d0d0d0;
+ box-shadow: 0 2px 8px rgba(0, 0, 0, 0.08);
}
.loading::after {
content: '';
- width: 48px;
- height: 48px;
- border: 5px solid #e1bee7;
- border-top-color: #5e35b1;
- border-right-color: #7b1fa2;
+ width: 40px;
+ height: 40px;
+ border: 4px solid #e0e0e0;
+ border-top-color: #4a4a4a;
border-radius: 50%;
- animation: spin 0.8s cubic-bezier(0.68, -0.55, 0.265, 1.55) infinite;
+ animation: spin 0.8s linear infinite;
}
@keyframes spin {
@@ -403,101 +330,62 @@
}
.error {
- color: #c62828;
- background: linear-gradient(135deg, #ffebee 0%, #ffcdd2 100%);
- border-radius: 12px;
- border: 2px solid #ef5350;
+ color: #d32f2f;
+ background: #ffebee;
+ border-radius: 8px;
+ border: 1px solid #ffcdd2;
max-width: 550px;
margin: 0 auto;
- box-shadow: 0 4px 12px rgba(198, 40, 40, 0.15);
font-weight: 500;
}
-.error::before {
- content: '⚠️';
- font-size: 2.5rem;
- display: block;
- margin-bottom: 0.5rem;
-}
-
.empty {
- color: #616161;
- background: linear-gradient(135deg, #fafafa 0%, #f5f5f5 100%);
- border-radius: 12px;
- border: 2px solid #e0e0e0;
+ color: #6a6a6a;
+ background: #f5f5f5;
+ border-radius: 8px;
+ border: 1px solid #e0e0e0;
max-width: 550px;
margin: 0 auto;
- box-shadow: 0 4px 12px rgba(0, 0, 0, 0.08);
font-weight: 500;
}
-.empty::before {
- content: '🔍';
- font-size: 2.5rem;
- display: block;
- margin-bottom: 0.5rem;
-}
-
.btn {
padding: 0.625rem 1.25rem;
- border-radius: 6px;
+ border-radius: 4px;
border: none;
font-size: 0.9rem;
font-weight: 600;
cursor: pointer;
- transition: all 0.25s cubic-bezier(0.4, 0, 0.2, 1);
+ transition: all 0.2s ease;
font-family: 'Instrument Sans', sans-serif;
display: inline-flex;
align-items: center;
justify-content: center;
gap: 0.5rem;
- position: relative;
- overflow: hidden;
-}
-
-.btn::before {
- content: '';
- position: absolute;
- top: 50%;
- left: 50%;
- width: 0;
- height: 0;
- border-radius: 50%;
- background: rgba(255, 255, 255, 0.3);
- transform: translate(-50%, -50%);
- transition: width 0.6s, height 0.6s;
}
-.btn:hover::before {
- width: 300px;
- height: 300px;
-}
.btn-primary {
- background: linear-gradient(135deg, #5e35b1 0%, #7b1fa2 100%);
+ background: #2d2d2d;
color: white;
- box-shadow: 0 2px 4px rgba(94, 53, 177, 0.3);
+ box-shadow: 0 2px 4px rgba(0, 0, 0, 0.15);
}
.btn-primary:hover {
- background: linear-gradient(135deg, #512da8 0%, #6a1b9a 100%);
- transform: translateY(-2px);
- box-shadow: 0 4px 12px rgba(94, 53, 177, 0.4);
+ background: #1a1a1a;
+ transform: translateY(-1px);
+ box-shadow: 0 3px 8px rgba(0, 0, 0, 0.2);
}
.btn-secondary {
background: #f5f5f5;
- color: #1a1a1a;
- border: 2px solid #e0e0e0;
- box-shadow: 0 1px 3px rgba(0, 0, 0, 0.08);
+ color: #2d2d2d;
+ border: 1px solid #d0d0d0;
}
.btn-secondary:hover {
- background: #ffffff;
- border-color: #5e35b1;
- color: #5e35b1;
- transform: translateY(-1px);
- box-shadow: 0 2px 6px rgba(0, 0, 0, 0.12);
+ background: #e8e8e8;
+ border-color: #b0b0b0;
}
.btn-small {
@@ -585,7 +473,7 @@
--text-primary: #ffffff;
--text-secondary: #cccccc;
--border-color: #444444;
- --accent-color: #64b5f6;
+ --accent-color: #4a4a4a;
}
[data-theme="light"] {
@@ -595,32 +483,31 @@
--text-primary: #1a1a1a;
--text-secondary: #666666;
--border-color: #d0d0d0;
- --accent-color: #1976d2;
+ --accent-color: #4a4a4a;
}
/* Random Model Button */
.random-model-btn {
display: flex;
align-items: center;
- gap: 0.5rem;
- padding: 0.5rem 1rem;
- background: var(--accent-color, #4a90e2);
+ justify-content: center;
+ padding: 0.625rem 1.25rem;
+ background: #2d2d2d;
color: white;
border: none;
border-radius: 4px;
cursor: pointer;
font-size: 0.9rem;
font-family: 'Instrument Sans', sans-serif;
- font-weight: 500;
+ font-weight: 600;
transition: all 0.2s;
width: 100%;
- justify-content: center;
}
.random-model-btn:hover:not(:disabled) {
- background: var(--accent-color, #357abd);
+ background: #1a1a1a;
transform: translateY(-1px);
- box-shadow: 0 2px 4px rgba(0, 0, 0, 0.2);
+ box-shadow: 0 2px 6px rgba(0, 0, 0, 0.2);
}
.random-model-btn:disabled {
@@ -628,10 +515,6 @@
cursor: not-allowed;
}
-.random-icon {
- font-size: 1.1rem;
-}
-
/* Zoom Slider */
.zoom-slider-container {
margin-bottom: 1rem;
@@ -859,7 +742,7 @@
width: 18px;
height: 18px;
cursor: pointer;
- accent-color: #5e35b1;
+ accent-color: #4a4a4a;
margin-right: 0.5rem;
}
diff --git a/frontend/src/App.tsx b/frontend/src/App.tsx
index fff1c9f7e7175148d2286e21e6d02709cf7dce24..b7028115b168e32fdba258e31fafaab691d453d3 100644
--- a/frontend/src/App.tsx
+++ b/frontend/src/App.tsx
@@ -506,28 +506,24 @@ function App() {
alignItems: 'center',
marginBottom: '1.5rem',
paddingBottom: '1rem',
- borderBottom: '2px solid #e8e8e8'
+ borderBottom: '1px solid #e0e0e0'
}}>
Filters & Controls
{activeFilterCount > 0 && (
{activeFilterCount} active
@@ -537,40 +533,40 @@ function App() {
{/* Filter Results Count */}
{!loading && data.length > 0 && (
-
+
{data.length.toLocaleString()}
-
+
{data.length === 1 ? 'model' : 'models'}
{embeddingType === 'graph-aware' && (
- 🌐 Graph
+ Graph
)}
{filteredCount !== null && filteredCount !== data.length && (
-
+
of {filteredCount.toLocaleString()} matching
)}
{stats && filteredCount !== null && filteredCount < stats.total_models && (
-
+
from {stats.total_models.toLocaleString()} total
)}
@@ -579,15 +575,7 @@ function App() {
{/* Search Section */}
-
- 🔍 Search Models
-
+
Search Models
-
- 📊 Popularity Filters
-
+
Popularity Filters