updated answer_comparison prompt + small cleanup

2025-04-07 19:38:19 +02:00 · 2025-01-26 14:03:44 -08:00 · 2025-01-26 14:03:44 -08:00 · 9e9bd440f4
commit 9e9bd440f4
parent 7487b15522
3 changed files with 20 additions and 186 deletions
--- a/backend/onyx/agents/agent_search/deep_search_a/initial_search_sq_subgraph/nodes/ingest_initial_sub_question_answers.py
+++ b/backend/onyx/agents/agent_search/deep_search_a/initial_search_sq_subgraph/nodes/ingest_initial_sub_question_answers.py
@ -1,41 +0,0 @@
-from datetime import datetime
-
-from onyx.agents.agent_search.deep_search_a.answer_initial_sub_question.states import (
-    AnswerQuestionOutput,
-)
-from onyx.agents.agent_search.deep_search_a.main.operations import logger
-from onyx.agents.agent_search.deep_search_a.main.states import DecompAnswersUpdate
-from onyx.agents.agent_search.shared_graph_utils.operators import (
-    dedup_inference_sections,
-)
-
-
-def ingest_initial_sub_question_answers(
-    state: AnswerQuestionOutput,
-) -> DecompAnswersUpdate:
-    now_start = datetime.now()
-
-    logger.debug(f"--------{now_start}--------INGEST ANSWERS---")
-    documents = []
-    context_documents = []
-    answer_results = state.answer_results if hasattr(state, "answer_results") else []
-    for answer_result in answer_results:
-        documents.extend(answer_result.documents)
-        context_documents.extend(answer_result.context_documents)
-
-    now_end = datetime.now()
-
-    logger.debug(
-        f"--------{now_end}--{now_end - now_start}--------INGEST ANSWERS END---"
-    )
-
-    return DecompAnswersUpdate(
-        # Deduping is done by the documents operator for the main graph
-        # so we might not need to dedup here
-        documents=dedup_inference_sections(documents, []),
-        context_documents=dedup_inference_sections(context_documents, []),
-        decomp_answer_results=answer_results,
-        log_messages=[
-            f"{now_start} -- Main - Ingest initial processed sub questions,  Time taken: {now_end - now_start}"
-        ],
-    )
--- a/backend/onyx/agents/agent_search/deep_search_a/initial_search_sq_subgraph/nodes/initial_sub_question_creation.py
+++ b/backend/onyx/agents/agent_search/deep_search_a/initial_search_sq_subgraph/nodes/initial_sub_question_creation.py
@ -1,135 +0,0 @@
-from datetime import datetime
-from typing import cast
-
-from langchain_core.callbacks.manager import dispatch_custom_event
-from langchain_core.messages import HumanMessage
-from langchain_core.messages import merge_content
-from langchain_core.runnables import RunnableConfig
-
-from onyx.agents.agent_search.deep_search_a.initial_search_sq_subgraph.states import (
-    SearchSQState,
-)
-from onyx.agents.agent_search.deep_search_a.main.models import AgentRefinedMetrics
-from onyx.agents.agent_search.deep_search_a.main.operations import dispatch_subquestion
-from onyx.agents.agent_search.deep_search_a.main.operations import logger
-from onyx.agents.agent_search.deep_search_a.main.states import BaseDecompUpdate
-from onyx.agents.agent_search.models import AgentSearchConfig
-from onyx.agents.agent_search.shared_graph_utils.agent_prompt_ops import (
-    build_history_prompt,
-)
-from onyx.agents.agent_search.shared_graph_utils.prompts import (
-    INITIAL_DECOMPOSITION_PROMPT_QUESTIONS,
-)
-from onyx.agents.agent_search.shared_graph_utils.prompts import (
-    INITIAL_DECOMPOSITION_PROMPT_QUESTIONS_AFTER_SEARCH,
-)
-from onyx.agents.agent_search.shared_graph_utils.utils import dispatch_separated
-from onyx.chat.models import StreamStopInfo
-from onyx.chat.models import StreamStopReason
-from onyx.chat.models import SubQuestionPiece
-from onyx.configs.agent_configs import AGENT_NUM_DOCS_FOR_DECOMPOSITION
-
-
-def initial_sub_question_creation(
-    state: SearchSQState, config: RunnableConfig
-) -> BaseDecompUpdate:
-    now_start = datetime.now()
-
-    logger.debug(f"--------{now_start}--------BASE DECOMP START---")
-
-    agent_a_config = cast(AgentSearchConfig, config["metadata"]["config"])
-    question = agent_a_config.search_request.query
-    chat_session_id = agent_a_config.chat_session_id
-    primary_message_id = agent_a_config.message_id
-    perform_initial_search_decomposition = (
-        agent_a_config.perform_initial_search_decomposition
-    )
-    # perform_initial_search_path_decision = (
-    #     agent_a_config.perform_initial_search_path_decision
-    # )
-    history = build_history_prompt(agent_a_config.prompt_builder)
-
-    # Use the initial search results to inform the decomposition
-    sample_doc_str = state.sample_doc_str if hasattr(state, "sample_doc_str") else ""
-
-    if not chat_session_id or not primary_message_id:
-        raise ValueError(
-            "chat_session_id and message_id must be provided for agent search"
-        )
-    agent_start_time = datetime.now()
-
-    # Initial search to inform decomposition. Just get top 3 fits
-
-    if perform_initial_search_decomposition:
-        sample_doc_str = "\n\n".join(
-            [
-                doc.combined_content
-                for doc in state.exploratory_search_results[
-                    :AGENT_NUM_DOCS_FOR_DECOMPOSITION
-                ]
-            ]
-        )
-
-        decomposition_prompt = (
-            INITIAL_DECOMPOSITION_PROMPT_QUESTIONS_AFTER_SEARCH.format(
-                question=question, sample_doc_str=sample_doc_str, history=history
-            )
-        )
-
-    else:
-        decomposition_prompt = INITIAL_DECOMPOSITION_PROMPT_QUESTIONS.format(
-            question=question, history=history
-        )
-
-    # Start decomposition
-
-    msg = [HumanMessage(content=decomposition_prompt)]
-
-    # Get the rewritten queries in a defined format
-    model = agent_a_config.fast_llm
-
-    # Send the initial question as a subquestion with number 0
-    dispatch_custom_event(
-        "decomp_qs",
-        SubQuestionPiece(
-            sub_question=question,
-            level=0,
-            level_question_nr=0,
-        ),
-    )
-    # dispatches custom events for subquestion tokens, adding in subquestion ids.
-    streamed_tokens = dispatch_separated(model.stream(msg), dispatch_subquestion(0))
-
-    stop_event = StreamStopInfo(
-        stop_reason=StreamStopReason.FINISHED,
-        stream_type="sub_questions",
-        level=0,
-    )
-    dispatch_custom_event("stream_finished", stop_event)
-
-    deomposition_response = merge_content(*streamed_tokens)
-
-    # this call should only return strings. Commenting out for efficiency
-    # assert [type(tok) == str for tok in streamed_tokens]
-
-    # use no-op cast() instead of str() which runs code
-    # list_of_subquestions = clean_and_parse_list_string(cast(str, response))
-    list_of_subqs = cast(str, deomposition_response).split("\n")
-
-    decomp_list: list[str] = [sq.strip() for sq in list_of_subqs if sq.strip() != ""]
-
-    now_end = datetime.now()
-
-    logger.debug(f"--------{now_end}--{now_end - now_start}--------BASE DECOMP END---")
-
-    return BaseDecompUpdate(
-        initial_decomp_questions=decomp_list,
-        agent_start_time=agent_start_time,
-        agent_refined_start_time=None,
-        agent_refined_end_time=None,
-        agent_refined_metrics=AgentRefinedMetrics(
-            refined_doc_boost_factor=None,
-            refined_question_boost_factor=None,
-            duration__s=None,
-        ),
-    )
--- a/backend/onyx/agents/agent_search/shared_graph_utils/prompts.py
+++ b/backend/onyx/agents/agent_search/shared_graph_utils/prompts.py
@ -1053,24 +1053,34 @@ Please format your answer as a json object in the following format:

   """
 ANSWER_COMPARISON_PROMPT = """
-    For the given question, please compare the initial answer and the refined answer and determine if
+For the given question, please compare the initial answer and the refined answer and determine if
 the refined answer is substantially better than the initial answer. Better could mean:
 - additional information
 - more comprehensive information
 - more concise information
 - more structured information
+ - new bullet points
 - substantially more document citations ([[D1]](), [[D2]](), [[D3]](), etc.)

- Here is the question:
- {question}
+ Put yourself in the shoes of the user and think about whether the refined answer is really substantially
+ better than the initial answer.

- Here is the initial answer:
- {initial_answer}
+Here is the question:
+--
+{question}
+--

- Here is the refined answer:
- {refined_answer}
+Here is the initial answer:
+--
+{initial_answer}
+--

- With these criteria in mind, is the refined answer substantially better than the initial answer?
+Here is the refined answer:
+--
+{refined_answer}
+--

- Please answer with a simple 'yes' or 'no'.
-    """
+With these criteria in mind, is the refined answer substantially better than the initial answer?
+
+Please answer with a simple 'yes' or 'no'.
+"""