
Commit adf33de

Orbital-Web and greptile-apps[bot] authored and committed
feat: search quality eval (onyx-dot-app#4720)
* fix: import order
* test examples
* fix: import
* wip: reranker based eval
* fix: import order
* feat: adjuted score
* fix: mypy
* fix: suggestions
* sorry cvs, you must go
* fix: mypy
* fix: suggestions

Co-authored-by: greptile-apps[bot] <165735046+greptile-apps[bot]@users.noreply.github.com>
1 parent abc51ae commit adf33de

File tree: 6 files changed, +558 −1 lines changed


backend/onyx/context/search/utils.py

Lines changed: 5 additions & 1 deletion
```diff
@@ -12,6 +12,9 @@
 from onyx.context.search.models import SavedSearchDocWithContent
 from onyx.context.search.models import SearchDoc
 from onyx.db.models import SearchDoc as DBSearchDoc
+from onyx.utils.logger import setup_logger
+
+logger = setup_logger()
 
 
 T = TypeVar(
@@ -154,5 +157,6 @@ def remove_stop_words_and_punctuation(keywords: list[str]) -> list[str]:
             if (word.casefold() not in stop_words and word not in string.punctuation)
         ]
         return text_trimmed or word_tokens
-    except Exception:
+    except Exception as e:
+        logger.warning(f"Error removing stop words and punctuation: {e}")
         return keywords
```
Lines changed: 56 additions & 0 deletions (new file)
# Search Quality Test Script

This Python script evaluates the search results for a list of queries.

Unlike the script in answer_quality, this script is much less customizable and runs against currently ingested documents. However, it allows for quick testing of search parameters on a set of test queries that don't have well-defined answers.
## Usage

1. Ensure you have the required dependencies installed and Onyx running.

2. Ensure a reranker model is configured in the search settings.
This can be checked/modified by opening the admin panel, going to search settings, and ensuring a reranking model is set.

3. Set up the PYTHONPATH permanently:
Add the following line to your shell configuration file (e.g., `~/.bashrc`, `~/.zshrc`, or `~/.bash_profile`):
```
export PYTHONPATH=$PYTHONPATH:/path/to/onyx/backend
```
Replace `/path/to/onyx` with the actual path to your Onyx repository.
After adding this line, restart your terminal or run `source ~/.bashrc` (or the appropriate config file) to apply the changes.
4. Navigate to the `search_quality` folder in the Onyx repo:

```
cd path/to/onyx/backend/tests/regression/search_quality
```

5. Copy `search_queries.json.template` to `search_queries.json` and add/remove test queries in it.
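Since `generate_search_queries.py` loads this file with a plain `json.load` and treats it as a `list[str]`, `search_queries.json` is just a JSON array of query strings. For example (illustrative placeholder queries, not part of the template):

```
[
    "How do I configure a reranking model?",
    "Which connectors does Onyx support?",
    "Where are search settings stored?"
]
```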
6. Run `generate_search_queries.py` to generate the modified queries for the search pipeline:

```
python generate_search_queries.py
```

7. Copy `search_eval_config.yaml.template` to `search_eval_config.yaml` and specify the search and eval parameters.
8. Run `run_search_eval.py` to evaluate the search results against the reranked results:

```
python run_search_eval.py
```

9. Repeat steps 7 and 8 to test and compare different search parameters.
## Metrics
- Jaccard Similarity: the ratio of the intersection to the union of the topk search and rerank results. Higher is better.
- Average Rank Change: the average absolute rank difference between the topk reranked chunks and their positions in the full search results. Lower is better.
- Average Missing Chunk Ratio: the number of topk reranked chunks that are missing from the topk search chunks, divided by topk. Lower is better.

Note that all of these metrics are affected by very narrow search results.
E.g., if topk is 20 but there is only 1 relevant document, the other 19 documents could be ordered arbitrarily, resulting in a lower score.
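As a rough sketch of the definitions above (this is not the actual code in `run_search_eval.py`), the metrics can be computed from the ranked chunk IDs of the search and rerank results like so:

```python
def eval_topk(
    search_ids: list[str], rerank_ids: list[str], topk: int
) -> dict[str, float]:
    """Illustrative versions of the metrics described above, not the real implementation."""
    search_topk = set(search_ids[:topk])
    rerank_topk = set(rerank_ids[:topk])

    # Jaccard similarity: |intersection| / |union| of the topk search and rerank results
    union = search_topk | rerank_topk
    jaccard = len(search_topk & rerank_topk) / len(union) if union else 1.0

    # average rank change: mean absolute difference between a chunk's rerank position
    # (within topk) and its position in the full search ranking
    search_rank = {chunk_id: rank for rank, chunk_id in enumerate(search_ids)}
    rank_changes = [
        abs(rank - search_rank[chunk_id])
        for rank, chunk_id in enumerate(rerank_ids[:topk])
        if chunk_id in search_rank
    ]
    avg_rank_change = sum(rank_changes) / len(rank_changes) if rank_changes else 0.0

    # missing chunk ratio: fraction of topk reranked chunks absent from the topk search chunks
    missing_ratio = len(rerank_topk - search_topk) / topk

    return {
        "jaccard_similarity": jaccard,
        "average_rank_change": avg_rank_change,
        "average_missing_chunk_ratio": missing_ratio,
    }
```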
To address this limitation, there are score-adjusted versions of the metrics.
The score-adjusted versions do not use a fixed topk; instead, they compute an optimum topk based on the rerank scores.
This generally works well for determining how many documents are relevant, although the approach isn't perfect.
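The commit does not spell out here how the optimum topk is derived from the rerank scores. One plausible heuristic, shown purely for illustration (and assuming the scores are sorted in descending order), is to cut the ranking at the largest drop in score:

```python
def adjusted_topk(rerank_scores: list[float], min_k: int = 1) -> int:
    """Illustrative heuristic only: place the topk cutoff at the steepest score drop."""
    if len(rerank_scores) <= min_k:
        return len(rerank_scores)
    drops = [
        rerank_scores[i] - rerank_scores[i + 1] for i in range(len(rerank_scores) - 1)
    ]
    # cut just after the steepest drop, but keep at least min_k results
    return max(min_k, drops.index(max(drops)) + 1)
```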
Lines changed: 124 additions & 0 deletions (new file)

```python
import json
from pathlib import Path

from langgraph.types import StreamWriter

from onyx.agents.agent_search.basic.utils import process_llm_stream
from onyx.chat.models import PromptConfig
from onyx.chat.prompt_builder.answer_prompt_builder import AnswerPromptBuilder
from onyx.chat.prompt_builder.answer_prompt_builder import default_build_system_message
from onyx.chat.prompt_builder.answer_prompt_builder import default_build_user_message
from onyx.configs.app_configs import POSTGRES_API_SERVER_POOL_OVERFLOW
from onyx.configs.app_configs import POSTGRES_API_SERVER_POOL_SIZE
from onyx.configs.constants import DEFAULT_PERSONA_ID
from onyx.db.engine import get_session_with_current_tenant
from onyx.db.engine import SqlEngine
from onyx.db.persona import get_persona_by_id
from onyx.llm.factory import get_llms_for_persona
from onyx.llm.interfaces import LLM
from onyx.tools.tool_implementations.search.search_tool import SearchTool
from onyx.tools.utils import explicit_tool_calling_supported
from onyx.utils.logger import setup_logger

logger = setup_logger()


def _load_queries() -> list[str]:
    current_dir = Path(__file__).parent
    with open(current_dir / "search_queries.json", "r") as file:
        return json.load(file)


def _modify_one_query(
    query: str,
    llm: LLM,
    prompt_config: PromptConfig,
    tool_definition: dict,
    writer: StreamWriter = lambda _: None,
) -> str:
    prompt_builder = AnswerPromptBuilder(
        user_message=default_build_user_message(
            user_query=query,
            prompt_config=prompt_config,
            files=[],
            single_message_history=None,
        ),
        system_message=default_build_system_message(prompt_config, llm.config),
        message_history=[],
        llm_config=llm.config,
        raw_user_query=query,
        raw_user_uploaded_files=[],
        single_message_history=None,
    )
    prompt = prompt_builder.build()

    stream = llm.stream(
        prompt=prompt,
        tools=[tool_definition],
        tool_choice="required",
        structured_response_format=None,
    )
    tool_message = process_llm_stream(
        messages=stream,
        should_stream_answer=False,
        writer=writer,
    )
    return (
        tool_message.tool_calls[0]["args"]["query"]
        if tool_message.tool_calls
        else query
    )


class SearchToolOverride(SearchTool):
    def __init__(self) -> None:
        # do nothing, the tool_definition function doesn't require variables to be initialized
        pass


def generate_search_queries() -> None:
    SqlEngine.init_engine(
        pool_size=POSTGRES_API_SERVER_POOL_SIZE,
        max_overflow=POSTGRES_API_SERVER_POOL_OVERFLOW,
    )

    queries = _load_queries()

    with get_session_with_current_tenant() as db_session:
        persona = get_persona_by_id(DEFAULT_PERSONA_ID, None, db_session)
        llm, _ = get_llms_for_persona(persona)
        prompt_config = PromptConfig.from_model(persona.prompts[0])
        tool_definition = SearchToolOverride().tool_definition()

    tool_call_supported = explicit_tool_calling_supported(
        llm.config.model_provider, llm.config.model_name
    )

    if tool_call_supported:
        logger.info(
            "Tool calling is supported for the current model. Modifying queries."
        )
        modified_queries = [
            _modify_one_query(
                query=query,
                llm=llm,
                prompt_config=prompt_config,
                tool_definition=tool_definition,
            )
            for query in queries
        ]
    else:
        logger.warning(
            "Tool calling is not supported for the current model. "
            "Using the original queries."
        )
        modified_queries = queries

    with open("search_queries_modified.json", "w") as file:
        json.dump(modified_queries, file, indent=4)

    logger.info("Exported modified queries to search_queries_modified.json")


if __name__ == "__main__":
    generate_search_queries()
```
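Since the script dumps `modified_queries` (a `list[str]`) with `json.dump(..., indent=4)`, the resulting `search_queries_modified.json` is again a plain JSON array of query strings. The entries below are made-up examples of rewritten queries, not actual output:

```
[
    "configure reranking model search settings",
    "supported connector types",
    "search settings storage location"
]
```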
