2 changes: 1 addition & 1 deletion code/python/core/ranking.py
@@ -311,7 +311,7 @@ async def sendAnswers(self, answers, force=False):
logger.info("Fast track ranking successful")

# Use the new schema to create and auto-send the message
create_assistant_result(json_results, handler=self.handler)
await create_assistant_result(json_results, handler=self.handler)
self.num_results_sent += len(json_results)
logger.info(f"Sent {len(json_results)} results, total sent: {self.num_results_sent}/{max_results}")
except (BrokenPipeError, ConnectionResetError) as e:
8 changes: 3 additions & 5 deletions code/python/core/schemas.py
@@ -10,7 +10,6 @@
from enum import Enum
import uuid


class SenderType(str, Enum):
"""Who sent the message."""
USER = "user"
@@ -298,7 +297,7 @@ def create_user_message(query: str, site: Optional[str] = None, mode: Optional[s
return message


def create_assistant_result(results: List[Dict[str, Any]],
async def create_assistant_result(results: List[Dict[str, Any]],
handler=None,
metadata: Optional[Dict[str, Any]] = None,
send: bool = True) -> Message:
@@ -323,8 +322,7 @@ def create_assistant_result(results: List[Dict[str, Any]],
)

if send and handler:
import asyncio
asyncio.create_task(handler.send_message(message.to_dict()))
await handler.send_message(message.to_dict())

return message

@@ -471,4 +469,4 @@ def create_legacy_message(message_type: str, content: Any,
if sender_info:
message["sender_info"] = sender_info

return message
return message
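With this change `create_assistant_result` becomes a coroutine that awaits `handler.send_message(...)` directly instead of scheduling it with `asyncio.create_task`, which is why the call sites in `ranking.py` and `whoRanking.py` now `await create_assistant_result(...)`. The sketch below only contrasts the two send patterns; it is not code from this PR. `FakeHandler`, `old_style`, and `new_style` are made-up names, and the one assumption carried over from the diff is that the handler exposes an async `send_message` taking a dict.

```python
import asyncio
from typing import Any, Dict, List


class FakeHandler:
    """Hypothetical handler; only the async send_message method is assumed."""

    async def send_message(self, payload: Dict[str, Any]) -> None:
        await asyncio.sleep(0)  # stand-in for real network I/O
        print(f"delivered {len(payload['content'])} result(s)")


async def old_style(handler: FakeHandler, results: List[Dict[str, Any]]) -> None:
    # Before: fire-and-forget. The send is scheduled but not awaited, so the
    # caller returns immediately, exceptions surface only inside the task,
    # and ordering relative to later sends is not guaranteed.
    asyncio.create_task(handler.send_message({"content": results}))


async def new_style(handler: FakeHandler, results: List[Dict[str, Any]]) -> None:
    # After: the send is awaited, so the caller resumes only once the message
    # has been handed off and any error propagates to the await site.
    await handler.send_message({"content": results})


async def main() -> None:
    handler = FakeHandler()
    results = [{"url": "https://example.com", "score": 80}]
    await old_style(handler, results)  # returns before delivery completes
    await new_style(handler, results)  # returns after delivery completes
    await asyncio.sleep(0.01)          # give the fire-and-forget task time to finish


asyncio.run(main())
```

Awaiting the send means completion and failures are visible at the call site (e.g. the `BrokenPipeError`/`ConnectionResetError` handling in `ranking.py`), at the cost of the caller pausing until the message is handed off.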
146 changes: 89 additions & 57 deletions code/python/core/whoRanking.py
@@ -13,11 +13,12 @@
from misc.logger.logging_config_helper import get_configured_logger
from core.schemas import create_assistant_result


logger = get_configured_logger("who_ranking_engine")


class WhoRanking:

EARLY_SEND_THRESHOLD = 59
NUM_RESULTS_TO_SEND = 10

@@ -28,7 +29,7 @@ def __init__(self, handler, items, level="low"):
self.items = items
self.num_results_sent = 0
self.rankedAnswers = []

def get_ranking_prompt(self, query, site_description):
"""Construct the WHO ranking prompt with the given query and site description."""
prompt = f"""Assign a score between 0 and 100 to the following site based
@@ -40,113 +41,139 @@

The site's description is: {site_description}
"""

response_structure = {
"score": "integer between 0 and 100",
"description": "short description of why this site is relevant",
"query": "the optimized query to send to this site (only if score > 70)"
"query": "the optimized query to send to this site (only if score > 70)",
}

return prompt, response_structure

async def rankItem(self, url, json_str, name, site):
"""Rank a single site for relevance to the query."""
try:
description = trim_json(json_str)
prompt, ans_struc = self.get_ranking_prompt(self.handler.query, description)
ranking = await ask_llm(prompt, ans_struc, level=self.level,
query_params=self.handler.query_params, timeout=90)

prompt, ans_struc = self.get_ranking_prompt(
self.handler.query, description
)
ranking = await ask_llm(
prompt,
ans_struc,
level=self.level,
query_params=self.handler.query_params,
timeout=90,
)

# Ensure ranking has required fields (handle LLM failures/timeouts)
if not ranking or not isinstance(ranking, dict):
ranking = {"score": 0, "description": "Failed to rank", "query": self.handler.query}
ranking = {
"score": 0,
"description": "Failed to rank",
"query": self.handler.query,
}
if "score" not in ranking:
ranking["score"] = 0
if "query" not in ranking:
ranking["query"] = self.handler.query

# Log the LLM score
# LLM Score recorded

# Handle both string and dictionary inputs for json_str
schema_object = json_str if isinstance(json_str, dict) else json.loads(json_str)

schema_object = (
json_str if isinstance(json_str, dict) else json.loads(json_str)
)

# Store the result
ansr = {
'url': url,
'site': site,
'name': name,
'ranking': ranking,
'schema_object': schema_object,
'sent': False,
"url": url,
"site": site,
"name": name,
"ranking": ranking,
"schema_object": schema_object,
"sent": False,
}

# Send immediately if high score
if ranking.get("score", 0) > self.EARLY_SEND_THRESHOLD:
logger.info(f"High score site: {name} (score: {ranking['score']}) - sending early")
logger.info(
f"High score site: {name} (score: {ranking['score']}) - sending early"
)
await self.sendAnswers([ansr])

self.rankedAnswers.append(ansr)
logger.debug(f"Site {name} added to ranked answers")

except Exception as e:
logger.error(f"Error in rankItem for {name}: {str(e)}")
logger.debug(f"Full error trace: ", exc_info=True)
# Still add the item with a zero score so we don't lose it completely
try:
schema_object = json_str if isinstance(json_str, dict) else json.loads(json_str)
schema_object = (
json_str if isinstance(json_str, dict) else json.loads(json_str)
)
ansr = {
'url': url,
'site': site,
'name': name,
'ranking': {"score": 0, "description": f"Error: {str(e)}", "query": self.handler.query},
'schema_object': schema_object,
'sent': False,
"url": url,
"site": site,
"name": name,
"ranking": {
"score": 0,
"description": f"Error: {str(e)}",
"query": self.handler.query,
},
"schema_object": schema_object,
"sent": False,
}
self.rankedAnswers.append(ansr)
except:
pass # Skip this item entirely if we can't even create a basic record

async def sendAnswers(self, answers, force=False):
"""Send ranked sites to the client."""
# Get max_results from handler, or use default
max_results = getattr(self.handler, 'max_results', self.NUM_RESULTS_TO_SEND)
json_results = []

for result in answers:
# Stop if we've already sent enough
if self.num_results_sent + len(json_results) >= self.NUM_RESULTS_TO_SEND:
logger.info(f"Stopping at {len(json_results)} results to avoid exceeding limit of {self.NUM_RESULTS_TO_SEND}")
if self.num_results_sent + len(json_results) >= max_results:
logger.info(
f"Stopping at {len(json_results)} results to avoid exceeding limit of {max_results}"
)
break

# Extract site type from schema_object
schema_obj = result.get("schema_object", {})
site_type = schema_obj.get("@type", "Website")

result_item = {
"@type": site_type, # Use the actual site type
"url": result["url"],
"name": result["name"],
"score": result["ranking"]["score"]
"score": result["ranking"]["score"],
}

# Include description if available
if "description" in result["ranking"]:
result_item["description"] = result["ranking"]["description"]

# Always include query field (required for WHO ranking)
if "query" in result["ranking"]:
result_item["query"] = result["ranking"]["query"]
else:
# Fallback to original query if no custom query provided
result_item["query"] = self.handler.query

json_results.append(result_item)
result["sent"] = True

if json_results:
# Use the new schema to create and auto-send the message
create_assistant_result(json_results, handler=self.handler)
await create_assistant_result(json_results, handler=self.handler)
self.num_results_sent += len(json_results)
logger.info(f"Sent {len(json_results)} results, total sent: {self.num_results_sent}/{self.NUM_RESULTS_TO_SEND}")
logger.info(
f"Sent {len(json_results)} results, total sent: {self.num_results_sent}/{max_results}"
)

async def do(self):
"""Main execution method - rank all sites concurrently."""
Expand All @@ -155,32 +182,37 @@ async def do(self):
tasks = []
for url, json_str, name, site in self.items:
tasks.append(asyncio.create_task(self.rankItem(url, json_str, name, site)))

# Wait for all ranking tasks to complete
try:
await asyncio.gather(*tasks, return_exceptions=True)
except Exception as e:
logger.error(f"Error during ranking tasks: {str(e)}")

# Filter and sort final results
filtered = [r for r in self.rankedAnswers if r.get('ranking', {}).get('score', 0) > 70]

# Use min_score from handler if available, otherwise default to 51
min_score_threshold = getattr(self.handler, 'min_score', 51)
# Use max_results from handler if available, otherwise use NUM_RESULTS_TO_SEND
max_results = getattr(self.handler, 'max_results', self.NUM_RESULTS_TO_SEND)
filtered = [r for r in self.rankedAnswers if r.get('ranking', {}).get('score', 0) > min_score_threshold]
ranked = sorted(filtered, key=lambda x: x.get('ranking', {}).get("score", 0), reverse=True)
self.handler.final_ranked_answers = ranked[:self.NUM_RESULTS_TO_SEND]
print(f"\n=== WHO RANKING: Filtered to {len(filtered)} results with score > 70 ===")
self.handler.final_ranked_answers = ranked[:max_results]

print(f"\n=== WHO RANKING: Filtered to {len(filtered)} results with score > {min_score_threshold} ===")

# Print the ranked sites with scores
print("\nRanked sites (top 10):")
for i, r in enumerate(ranked[:self.NUM_RESULTS_TO_SEND], 1):
for i, r in enumerate(ranked[:max_results], 1):
score = r.get('ranking', {}).get('score', 0)
print(f" {i}. {r['name']} - Score: {score}")
print("=" * 60)

# Final ranked results processed

# Send any remaining results that haven't been sent
results_to_send = [r for r in ranked if not r['sent']][:self.NUM_RESULTS_TO_SEND - self.num_results_sent]

results_to_send = [r for r in ranked if not r["sent"]][
: max_results - self.num_results_sent
]

if results_to_send:
logger.info(f"Sending final batch of {len(results_to_send)} results")
await self.sendAnswers(results_to_send, force=True)
await self.sendAnswers(results_to_send, force=True)
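The `do()` rewrite above swaps the hard-coded cutoffs (score > 70, top `NUM_RESULTS_TO_SEND`) for per-request values read from the handler with `getattr` fallbacks (`min_score`, defaulting to 51, and `max_results`, defaulting to `NUM_RESULTS_TO_SEND`). Below is a minimal sketch of just that selection step, pulled out of the class; the `SimpleNamespace` handlers and the sample scores are invented for illustration.

```python
from types import SimpleNamespace

NUM_RESULTS_TO_SEND = 10  # class-level default, as in WhoRanking


def select_results(handler, ranked_answers):
    # Per-request overrides win; otherwise fall back to the old defaults.
    min_score = getattr(handler, "min_score", 51)
    max_results = getattr(handler, "max_results", NUM_RESULTS_TO_SEND)

    filtered = [
        r for r in ranked_answers
        if r.get("ranking", {}).get("score", 0) > min_score
    ]
    ranked = sorted(
        filtered,
        key=lambda r: r.get("ranking", {}).get("score", 0),
        reverse=True,
    )
    return ranked[:max_results]


answers = [
    {"name": "site-a", "ranking": {"score": 88}},
    {"name": "site-b", "ranking": {"score": 60}},
    {"name": "site-c", "ranking": {"score": 40}},  # below the default cutoff
]

# No overrides on the handler -> defaults apply (min_score=51, max_results=10).
print([r["name"] for r in select_results(SimpleNamespace(), answers)])  # ['site-a', 'site-b']

# Overrides tighten the filter and the page size without touching the class constants.
strict = SimpleNamespace(min_score=75, max_results=1)
print([r["name"] for r in select_results(strict, answers)])             # ['site-a']
```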
6 changes: 5 additions & 1 deletion static/who.html
@@ -386,10 +386,14 @@ <h1>Agent Finder</h1>
this.eventSource.close();
}

const debugParams = new URLSearchParams(window.location.search);
const queryObj = Object.fromEntries(debugParams.entries());

// Create URL with query parameters including previous queries
const params = new URLSearchParams({
query: query,
streaming: 'true' // Use streaming mode
streaming: 'true', // Use streaming mode
...queryObj // Preserve other URL params (like retrieval, db, etc.)
});

// Add previous queries for context (limit to last 3 queries)