Merged

Changes from all commits
4 changes: 2 additions & 2 deletions code/python/core/embedding.py
@@ -272,10 +272,10 @@ async def batch_get_embeddings(
# Gemini might not have a native batch API, so process one by one
logger.debug("Getting Gemini batch embeddings (sequential)")
from embedding_providers.gemini_embedding import get_gemini_batch_embeddings
# Process texts one by one with individual timeouts
# Process texts one by one - use longer timeout since sequential processing with rate limits
result = await asyncio.wait_for(
get_gemini_batch_embeddings(texts, model=model_id),
timeout=30 # Individual timeout per text
timeout=timeout * len(texts) # Scale timeout with batch size
Copilot AI (Dec 18, 2025):

Scaling the timeout by multiplying by the number of texts (timeout * len(texts)) could result in excessively long timeouts for large batches. For example, with a default timeout of 30 seconds and 100 texts, this would be 3000 seconds (50 minutes). Consider using a more reasonable scaling factor (e.g., timeout + (len(texts) * 2)) or capping the maximum timeout to prevent unreasonably long waits.
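Editor's note: a minimal sketch of the capped scaling this comment suggests. BASE_TIMEOUT, PER_TEXT_TIMEOUT, MAX_TIMEOUT, and batch_timeout are illustrative names, not code from this PR:

    import asyncio

    BASE_TIMEOUT = 30      # assumed per-request default, in seconds
    PER_TEXT_TIMEOUT = 2   # incremental allowance per queued text
    MAX_TIMEOUT = 300      # hard ceiling so large batches cannot wait forever

    def batch_timeout(num_texts: int) -> float:
        """Grow the timeout linearly with batch size, but cap it."""
        return min(BASE_TIMEOUT + PER_TEXT_TIMEOUT * num_texts, MAX_TIMEOUT)

    async def bounded_wait(coro, num_texts: int):
        """Await a batch-embedding coroutine under the capped timeout."""
        return await asyncio.wait_for(coro, timeout=batch_timeout(num_texts))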
)
logger.debug(f"Gemini batch embeddings received, count: {len(result)}")
return result
2 changes: 1 addition & 1 deletion code/python/core/ranking.py
@@ -291,7 +291,7 @@ async def sendAnswers(self, answers, force=False):
self.handler.fastTrackWorked = True

# Use the new schema to create and auto-send the message
create_assistant_result(json_results, handler=self.handler)
await create_assistant_result(json_results, handler=self.handler)
self.num_results_sent += len(json_results)
except (BrokenPipeError, ConnectionResetError) as e:
self.handler.connection_alive_event.clear()
8 changes: 3 additions & 5 deletions code/python/core/schemas.py
@@ -10,7 +10,6 @@
from enum import Enum
import uuid


class SenderType(str, Enum):
"""Who sent the message."""
USER = "user"
@@ -298,7 +297,7 @@ def create_user_message(query: str, site: Optional[str] = None, mode: Optional[s
return message


def create_assistant_result(results: List[Dict[str, Any]],
async def create_assistant_result(results: List[Dict[str, Any]],
handler=None,
metadata: Optional[Dict[str, Any]] = None,
send: bool = True) -> Message:
@@ -323,8 +322,7 @@ def create_assistant_result(results: List[Dict[str, Any]],
)

if send and handler:
import asyncio
asyncio.create_task(handler.send_message(message.to_dict()))
await handler.send_message(message.to_dict())

return message
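Editor's note: the change from asyncio.create_task to await in this hunk is why callers in ranking.py and whoRanking.py now await create_assistant_result. A minimal, self-contained sketch of the difference in failure semantics, with FlakyHandler as an illustrative stand-in:

    import asyncio

    class FlakyHandler:
        """Illustrative stand-in for a connection handler whose write can fail."""
        async def send_message(self, payload: dict) -> None:
            await asyncio.sleep(0)  # placeholder for the real network write
            raise BrokenPipeError("client disconnected")

    async def main() -> None:
        handler = FlakyHandler()
        # With asyncio.create_task(handler.send_message(...)) the call returns
        # immediately and BrokenPipeError surfaces in the event loop, not here.
        try:
            await handler.send_message({"message_type": "result"})
        except (BrokenPipeError, ConnectionResetError) as e:
            print(f"caller can react here, e.g. clear connection_alive_event: {e}")

    asyncio.run(main())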

@@ -471,4 +469,4 @@ def create_legacy_message(message_type: str, content: Any,
if sender_info:
message["sender_info"] = sender_info

return message
return message
187 changes: 97 additions & 90 deletions code/python/core/whoRanking.py
@@ -13,12 +13,14 @@
from misc.logger.logging_config_helper import get_configured_logger
from core.schemas import create_assistant_result


logger = get_configured_logger("who_ranking_engine")

DEBUG_PRINT = False

class WhoRanking:


EARLY_SEND_THRESHOLD = 59
NUM_RESULTS_TO_SEND = 10

@@ -29,6 +31,7 @@ def __init__(self, handler, items, level="high"): # default to low level for WHO
self.items = items
self.num_results_sent = 0
self.rankedAnswers = []



def get_ranking_prompt(self, query, site_description):
@@ -48,81 +51,107 @@ def get_ranking_prompt(self, query, site_description):

The site's description is: {site_description}
"""

response_structure = {
"score": "integer between 0 and 100",
"description": "short description of why this site is relevant",
"query": "the optimized query to send to this site (only if score > 70)"
"query": "the optimized query to send to this site (only if score > 70)",
}

return prompt, response_structure

async def rankItem(self, url, json_str, name, site):
"""Rank a single site for relevance to the query."""
try:
description = trim_json(json_str)
prompt, ans_struc = self.get_ranking_prompt(self.handler.query, description)
ranking = await ask_llm(prompt, ans_struc, level=self.level,
query_params=self.handler.query_params, timeout=8)

prompt, ans_struc = self.get_ranking_prompt(
self.handler.query, description
)
ranking = await ask_llm(
prompt,
ans_struc,
level=self.level,
query_params=self.handler.query_params,
timeout=90,
Copilot AI (Dec 18, 2025):

The timeout for ranking LLM calls was increased from 8 seconds to 90 seconds, which is more than 11x longer. This could significantly slow down the WHO ranking process, especially when multiple sites are being ranked concurrently. Consider if this large increase is necessary, or if a more moderate timeout (e.g., 15-30 seconds) would be sufficient.

Suggested change:
-    timeout=90,
+    timeout=30,
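Editor's note: whichever timeout wins, a concurrency cap keeps one slow LLM call from monopolizing the ranking pass (do() fans out one task per site). A minimal sketch, assuming asyncio-based ranking coroutines; rank_all_bounded and its defaults are illustrative, not from this PR:

    import asyncio

    async def rank_all_bounded(coros, limit: int = 8, timeout: float = 30.0):
        """Run ranking coroutines with a concurrency cap and a per-call timeout."""
        sem = asyncio.Semaphore(limit)  # created inside the running loop

        async def one(coro):
            async with sem:
                return await asyncio.wait_for(coro, timeout=timeout)

        # Failures come back as exception values rather than cancelling the batch.
        return await asyncio.gather(*(one(c) for c in coros), return_exceptions=True)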
)

# Ensure ranking has required fields (handle LLM failures/timeouts)
if not ranking or not isinstance(ranking, dict):
ranking = {"score": 0, "description": "Failed to rank", "query": self.handler.query}
ranking = {
"score": 0,
"description": "Failed to rank",
"query": self.handler.query,
}
if "score" not in ranking:
ranking["score"] = 0
if "query" not in ranking:
ranking["query"] = self.handler.query

# Log the LLM score
# LLM Score recorded

# Handle both string and dictionary inputs for json_str
schema_object = json_str if isinstance(json_str, dict) else json.loads(json_str)

schema_object = (
json_str if isinstance(json_str, dict) else json.loads(json_str)
)

# Store the result
ansr = {
'url': url,
'site': site,
'name': name,
'ranking': ranking,
'schema_object': schema_object,
'sent': False,
"url": url,
"site": site,
"name": name,
"ranking": ranking,
"schema_object": schema_object,
"sent": False,
}

# Send immediately if high score
if ranking.get("score", 0) > self.EARLY_SEND_THRESHOLD:
logger.info(f"High score site: {name} (score: {ranking['score']}) - sending early")
logger.info(
f"High score site: {name} (score: {ranking['score']}) - sending early"
)
await self.sendAnswers([ansr])

self.rankedAnswers.append(ansr)
logger.debug(f"Site {name} added to ranked answers")

except Exception as e:
logger.error(f"Error in rankItem for {name}: {str(e)}")
logger.debug(f"Full error trace: ", exc_info=True)
# Still add the item with a zero score so we don't lose it completely
try:
schema_object = json_str if isinstance(json_str, dict) else json.loads(json_str)
schema_object = (
json_str if isinstance(json_str, dict) else json.loads(json_str)
)
ansr = {
'url': url,
'site': site,
'name': name,
'ranking': {"score": 0, "description": f"Error: {str(e)}", "query": self.handler.query},
'schema_object': schema_object,
'sent': False,
"url": url,
"site": site,
"name": name,
"ranking": {
"score": 0,
"description": f"Error: {str(e)}",
"query": self.handler.query,
},
"schema_object": schema_object,
"sent": False,
}
self.rankedAnswers.append(ansr)
except:
pass # Skip this item entirely if we can't even create a basic record

async def sendAnswers(self, answers, force=False):
"""Send ranked sites to the client."""
# Get max_results from handler, or use default
max_results = getattr(self.handler, 'max_results', self.NUM_RESULTS_TO_SEND)
json_results = []


for result in answers:
# Stop if we've already sent enough
if self.num_results_sent + len(json_results) >= self.NUM_RESULTS_TO_SEND:
logger.info(f"Stopping at {len(json_results)} results to avoid exceeding limit of {self.NUM_RESULTS_TO_SEND}")
if self.num_results_sent + len(json_results) >= max_results:
logger.info(
f"Stopping at {len(json_results)} results to avoid exceeding limit of {max_results}"
)
break

# Extract site type from schema_object
@@ -143,24 +172,34 @@ async def sendAnswers(self, answers, force=False):
"@type": site_type, # Use the actual site type
"url": complete_url, # Use the complete URL with gateway
"name": result["name"],
"score": result["ranking"]["score"]
"score": result["ranking"]["score"],
}


# Include description if available
if "description" in result["ranking"]:
result_item["description"] = result["ranking"]["description"]

# Always include query field (required for WHO ranking)
if "query" in result["ranking"]:
result_item["query"] = result["ranking"]["query"]
else:
# Fallback to original query if no custom query provided
result_item["query"] = self.handler.query


Comment on lines +183 to +190

Copilot AI (Dec 18, 2025):

The query field is being set twice with potentially different values. Lines 184-188 set it conditionally based on whether it exists in the ranking, then line 192 unconditionally overwrites it with site_query. This makes lines 183-188 redundant. Either remove lines 183-188 or remove line 192, depending on which behavior is desired.

Suggested change (remove the conditional block):
-    # Always include query field (required for WHO ranking)
-    if "query" in result["ranking"]:
-        result_item["query"] = result["ranking"]["query"]
-    else:
-        # Fallback to original query if no custom query provided
-        result_item["query"] = self.handler.query
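Editor's note: one way to resolve the duplication, assuming the later site_query assignment is the intended winner, is to compute the value once with explicit fallbacks. resolve_query is an illustrative helper, not code from this PR:

    def resolve_query(site_query, ranking: dict, original_query: str) -> str:
        """Pick the query to attach to a result item, in priority order."""
        return site_query or ranking.get("query") or original_query

    # The call site would then collapse both assignments into one:
    # result_item["query"] = resolve_query(site_query, result["ranking"], self.handler.query)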
# Include optimized query field (for display purposes)
result_item["query"] = site_query

json_results.append(result_item)
result["sent"] = True

if json_results:
# Use the new schema to create and auto-send the message
create_assistant_result(json_results, handler=self.handler)
await create_assistant_result(json_results, handler=self.handler)
self.num_results_sent += len(json_results)
logger.info(f"Sent {len(json_results)} results, total sent: {self.num_results_sent}/{self.NUM_RESULTS_TO_SEND}")
logger.info(
f"Sent {len(json_results)} results, total sent: {self.num_results_sent}/{max_results}"
)

async def do(self):
"""Main execution method - rank all sites concurrently."""
@@ -169,69 +208,37 @@ async def do(self):
tasks = []
for url, json_str, name, site in self.items:
tasks.append(asyncio.create_task(self.rankItem(url, json_str, name, site)))

# Wait for all ranking tasks to complete
try:
await asyncio.gather(*tasks, return_exceptions=True)
except Exception as e:
logger.error(f"Error during ranking tasks: {str(e)}")

# Filter and sort final results
filtered = [r for r in self.rankedAnswers if r.get('ranking', {}).get('score', 0) > 70]

# Use min_score from handler if available, otherwise default to 51
min_score_threshold = getattr(self.handler, 'min_score', 51)
Comment on lines +218 to +219

Copilot AI (Dec 18, 2025):

The minimum score threshold was changed from a hardcoded value of 70 to a configurable value with a default of 51. This is a significant behavioral change that will result in more lower-quality results being included. If this change is intentional, it should be documented. Otherwise, consider using 70 as the default to maintain backward compatibility: getattr(self.handler, 'min_score', 70).

Suggested change:
-    # Use min_score from handler if available, otherwise default to 51
-    min_score_threshold = getattr(self.handler, 'min_score', 51)
+    # Use min_score from handler if available, otherwise default to 70 (backward compatible)
+    min_score_threshold = getattr(self.handler, 'min_score', 70)
# Use max_results from handler if available, otherwise use NUM_RESULTS_TO_SEND
max_results = getattr(self.handler, 'max_results', self.NUM_RESULTS_TO_SEND)
filtered = [r for r in self.rankedAnswers if r.get('ranking', {}).get('score', 0) > min_score_threshold]
ranked = sorted(filtered, key=lambda x: x.get('ranking', {}).get("score", 0), reverse=True)
self.handler.final_ranked_answers = ranked[:self.NUM_RESULTS_TO_SEND]

if (DEBUG_PRINT):
print(f"\n=== WHO RANKING: Filtered to {len(filtered)} results with score > 70 ===")

# Print the ranked sites with scores
print("\nRanked sites (top 10):")
for i, r in enumerate(ranked[:self.NUM_RESULTS_TO_SEND], 1):
score = r.get('ranking', {}).get('score', 0)
print(f" {i}. {r['name']} - Score: {score}")
print("=" * 60)

# Print sites that were not returned
print("\n=== SITES NOT RETURNED (sorted by score) ===")

# Get all sites that were not included in the top 10
not_returned_high_score = ranked[self.NUM_RESULTS_TO_SEND:] # Sites with score > 70 but beyond top 10
not_returned_low_score = [r for r in self.rankedAnswers if r.get('ranking', {}).get('score', 0) <= 70]

# Sort low score sites by score (descending)
not_returned_low_score = sorted(not_returned_low_score,
key=lambda x: x.get('ranking', {}).get("score", 0),
reverse=True)

# Combine both lists
all_not_returned = not_returned_high_score + not_returned_low_score

if all_not_returned:
print(f"\nTotal sites not returned: {len(all_not_returned)}")

# Print sites with score > 70 that didn't make top 10
if not_returned_high_score:
print(f"\nSites with score > 70 but beyond top {self.NUM_RESULTS_TO_SEND}:")
for i, r in enumerate(not_returned_high_score, 1):
score = r.get('ranking', {}).get('score', 0)
print(f" {i}. {r['name']} - Score: {score}")

# Print sites with score <= 70
if not_returned_low_score:
print(f"\nSites with score <= 70:")
for i, r in enumerate(not_returned_low_score, 1):
score = r.get('ranking', {}).get('score', 0)
print(f" {i}. {r['name']} - Score: {score}")
else:
print("All retrieved sites were returned to the user.")
self.handler.final_ranked_answers = ranked[:max_results]

print(f"\n=== WHO RANKING: Filtered to {len(filtered)} results with score > {min_score_threshold} ===")

# Print the ranked sites with scores
print("\nRanked sites (top 10):")
for i, r in enumerate(ranked[:max_results], 1):
score = r.get('ranking', {}).get('score', 0)
print(f" {i}. {r['name']} - Score: {score}")
print("=" * 60)
Comment on lines +226 to +233

Copilot AI (Dec 18, 2025):

The debug print statements at lines 226-233 are now always executed, ignoring the DEBUG_PRINT flag defined at line 19. This means debug output will always be printed to console even when not desired. These print statements should be wrapped in if DEBUG_PRINT: or converted to use the logger instead (e.g., logger.debug(...)).

Suggested change:
-    print(f"\n=== WHO RANKING: Filtered to {len(filtered)} results with score > {min_score_threshold} ===")
-    # Print the ranked sites with scores
-    print("\nRanked sites (top 10):")
-    for i, r in enumerate(ranked[:max_results], 1):
-        score = r.get('ranking', {}).get('score', 0)
-        print(f"  {i}. {r['name']} - Score: {score}")
-    print("=" * 60)
+    if DEBUG_PRINT:
+        print(f"\n=== WHO RANKING: Filtered to {len(filtered)} results with score > {min_score_threshold} ===")
+        # Print the ranked sites with scores
+        print("\nRanked sites (top 10):")
+        for i, r in enumerate(ranked[:max_results], 1):
+            score = r.get('ranking', {}).get('score', 0)
+            print(f"  {i}. {r['name']} - Score: {score}")
+        print("=" * 60)
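Editor's note: a minimal sketch of the logger-based alternative this comment mentions, so verbosity is controlled by logging configuration rather than a module-level flag. log_ranking_summary is an illustrative helper, not code from this PR:

    from typing import Any, Dict, List

    def log_ranking_summary(logger, ranked: List[Dict[str, Any]],
                            filtered_count: int, min_score: int,
                            max_results: int) -> None:
        """Emit the post-ranking summary at DEBUG level instead of print()."""
        logger.debug("WHO RANKING: filtered to %d results with score > %d",
                     filtered_count, min_score)
        for i, r in enumerate(ranked[:max_results], 1):
            logger.debug("%d. %s - score: %s", i, r.get("name"),
                         r.get("ranking", {}).get("score", 0))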

print("=" * 60)

# Final ranked results processed

# Send any remaining results that haven't been sent
results_to_send = [r for r in ranked if not r['sent']][:self.NUM_RESULTS_TO_SEND - self.num_results_sent]

results_to_send = [r for r in ranked if not r["sent"]][
: max_results - self.num_results_sent
]

if results_to_send:
logger.info(f"Sending final batch of {len(results_to_send)} results")
await self.sendAnswers(results_to_send, force=True)
await self.sendAnswers(results_to_send, force=True)
4 changes: 4 additions & 0 deletions code/python/embedding_providers/gemini_embedding.py
@@ -13,6 +13,10 @@
import threading
from typing import List, Optional
import time
import logging

# Suppress gRPC ALTS credentials warning (not running on GCP)
logging.getLogger("grpc").setLevel(logging.ERROR)

import google.generativeai as genai
from core.config import CONFIG
9 changes: 9 additions & 0 deletions static/who.html
@@ -382,11 +382,20 @@ <h1>Agent Finder</h1>
this.eventSource.close();
}

const debugParams = new URLSearchParams(window.location.search);
const queryObj = Object.fromEntries(debugParams.entries());

Comment on lines +385 to +387

Copilot AI (Dec 18, 2025):

The variables debugParams and queryObj are created but never used. These lines should either be removed or the functionality that uses them should be implemented.

Suggested change (remove the unused lines):
-    const debugParams = new URLSearchParams(window.location.search);
-    const queryObj = Object.fromEntries(debugParams.entries());
// Create URL with query parameters
const params = new URLSearchParams({
query: query,
streaming: 'true' // Use streaming mode
});

// Add previous queries for context (limit to last 3 queries)
Copilot AI (Dec 18, 2025):

The code references this.queryHistory, which is never initialized in the constructor. This will cause a runtime error when trying to access the .length property of undefined. You need to add this.queryHistory = []; in the constructor method around lines 269-277.

Suggested change:
     // Add previous queries for context (limit to last 3 queries)
+    if (!Array.isArray(this.queryHistory)) {
+        this.queryHistory = [];
+    }
if (this.queryHistory.length > 0) {
const recentQueries = this.queryHistory.slice(-3);
params.append('prev_queries', JSON.stringify(recentQueries));
}

const url = `/who?${params.toString()}`;
