Spaces:

gkip
/

clinical_trial_inspector

Sleeping

Geoffrey Kip committed 16 days ago

Commit

7b7595c

1 Parent(s): fc58768

Fix: Cache embedding model initialization to prevent concurrency crashes

Files changed (2) hide show

ct_agent_app.py CHANGED Viewed

@@ -22,7 +22,13 @@ logging.getLogger("langchain_google_genai._function_utils").setLevel(logging.ERR
 load_dotenv()
 # Module Imports
-from modules.utils import load_index, setup_llama_index
 from modules.constants import COUNTRY_COORDINATES, STATE_COORDINATES
 # ... (imports)
@@ -68,6 +74,9 @@ st.markdown(
     unsafe_allow_html=True,
 )
 st.title("🧬 Clinical Trial Inspector Agent")
 # 1. Setup LLM & LlamaIndex Settings

 load_dotenv()
 # Module Imports
+from modules.utils import (
+    load_environment,
+    load_index,
+    setup_llama_index,
+    init_embedding_model,
+    get_hybrid_retriever,
+)
 from modules.constants import COUNTRY_COORDINATES, STATE_COORDINATES
 # ... (imports)
     unsafe_allow_html=True,
 )
+# Initialize global resources (Embeddings) once
+init_embedding_model()
 st.title("🧬 Clinical Trial Inspector Agent")
 # 1. Setup LLM & LlamaIndex Settings

modules/utils.py CHANGED Viewed

@@ -118,29 +118,35 @@ def load_environment():
 # --- Configuration ---
 def setup_llama_index(api_key: Optional[str] = None):
     """
-    Configures global LlamaIndex settings (LLM and Embeddings).
     """
     # Use passed key, or fallback to env var
     final_key = api_key or os.environ.get("GOOGLE_API_KEY")
     if not final_key:
-        # App handles prompting for key, so we just return or log warning
-        pass
     try:
         # Pass the key explicitly if available
         Settings.llm = Gemini(model="models/gemini-2.5-flash", temperature=0, api_key=final_key)
     except Exception as e:
-        print(f"⚠️ LLM initialization failed (likely missing API key): {e}")
-        print("⚠️ Using MockLLM for testing/fallback.")
         from llama_index.core.llms import MockLLM
         Settings.llm = MockLLM()
-    Settings.embed_model = HuggingFaceEmbedding(
-        model_name="pritamdeka/S-PubMedBert-MS-MARCO"
-    )
 @st.cache_resource

 # --- Configuration ---
+@st.cache_resource
+def init_embedding_model():
+    """Initializes and caches the embedding model globally."""
+    Settings.embed_model = HuggingFaceEmbedding(
+        model_name="pritamdeka/S-PubMedBert-MS-MARCO",
+        device="cpu"
+    )
 def setup_llama_index(api_key: Optional[str] = None):
     """
+    Configures global LlamaIndex settings (LLM).
+    Embedding model is handled by init_embedding_model().
     """
+    # Ensure embedding model is loaded
+    init_embedding_model()
     # Use passed key, or fallback to env var
     final_key = api_key or os.environ.get("GOOGLE_API_KEY")
     if not final_key:
+        return
     try:
         # Pass the key explicitly if available
         Settings.llm = Gemini(model="models/gemini-2.5-flash", temperature=0, api_key=final_key)
     except Exception as e:
+        print(f"⚠️ LLM initialization failed: {e}")
         from llama_index.core.llms import MockLLM
         Settings.llm = MockLLM()
 @st.cache_resource