Yuhong

2025-09-23 12:31:30 +02:00 · 2025-02-02 16:14:18 -08:00
parent a067b32467
commit 506a9f1b94
6 changed files with 149 additions and 125 deletions
--- a/backend/onyx/agents/agent_search/deep_search/main/nodes/extract_entities_terms.py
+++ b/backend/onyx/agents/agent_search/deep_search/main/nodes/extract_entities_terms.py
@@ -23,9 +23,8 @@ from onyx.agents.agent_search.shared_graph_utils.utils import (
    get_langgraph_node_log_string,
 )
 from onyx.configs.constants import NUM_EXPLORATORY_DOCS
-from onyx.prompts.agent_search import (
+from onyx.prompts.agent_search import ENTITY_TERM_EXTRACTION_PROMPT
-    ENTITY_TERM_EXTRACTION_PROMPT,
+from onyx.prompts.agent_search import ENTITY_TERM_EXTRACTION_PROMPT_JSON_EXAMPLE
 )
 def extract_entities_terms(
@@ -58,16 +57,21 @@ def extract_entities_terms(
    # start with the entity/term/extraction
    doc_context = format_docs(initial_search_docs)
    # Calculation here is only approximate
    doc_context = trim_prompt_piece(
        graph_config.tooling.fast_llm.config,
        doc_context,
-        ENTITY_TERM_EXTRACTION_PROMPT + question,
+        ENTITY_TERM_EXTRACTION_PROMPT
        + question
        + ENTITY_TERM_EXTRACTION_PROMPT_JSON_EXAMPLE,
    )
    msg = [
        HumanMessage(
            content=ENTITY_TERM_EXTRACTION_PROMPT.format(
                question=question, context=doc_context
-            ),
+            )
            + ENTITY_TERM_EXTRACTION_PROMPT_JSON_EXAMPLE,
        )
    ]
    fast_llm = graph_config.tooling.fast_llm
--- a/backend/onyx/agents/agent_search/shared_graph_utils/agent_prompt_ops.py
+++ b/backend/onyx/agents/agent_search/shared_graph_utils/agent_prompt_ops.py
@@ -13,6 +13,7 @@ from onyx.agents.agent_search.shared_graph_utils.utils import (
 from onyx.agents.agent_search.shared_graph_utils.utils import remove_document_citations
 from onyx.agents.agent_search.shared_graph_utils.utils import summarize_history
 from onyx.configs.agent_configs import AGENT_MAX_STATIC_HISTORY_WORD_LENGTH
 from onyx.configs.constants import MessageType
 from onyx.context.search.models import InferenceSection
 from onyx.llm.interfaces import LLMConfig
 from onyx.llm.utils import get_max_input_tokens
@@ -21,6 +22,9 @@ from onyx.natural_language_processing.utils import tokenizer_trim_content
 from onyx.prompts.agent_search import HISTORY_FRAMING_PROMPT
 from onyx.prompts.agent_search import SUB_QUESTION_RAG_PROMPT
 from onyx.prompts.prompt_utils import build_date_time_string
 from onyx.utils.logger import setup_logger
 logger = setup_logger()
 def build_sub_question_answer_prompt(
@@ -36,9 +40,9 @@ def build_sub_question_answer_prompt(
    date_str = build_date_time_string()
    # TODO: This should include document metadata and title
    docs_format_list = [
-        f"""Document Number: [D{doc_num + 1}]\n
+        f"Document Number: [D{doc_num + 1}]\nContent: {doc.combined_content}\n\n"
                             Content: {doc.combined_content}\n\n"""
        for doc_num, doc in enumerate(docs)
    ]
@@ -88,7 +92,6 @@ def trim_prompt_piece(config: LLMConfig, prompt_piece: str, reserved_str: str) -
 def build_history_prompt(config: GraphConfig, question: str) -> str:
    prompt_builder = config.inputs.prompt_builder
    model = config.tooling.fast_llm
    persona_base = get_persona_agent_prompt_expressions(
        config.inputs.search_request.persona
    ).base_prompt
@@ -102,23 +105,31 @@ def build_history_prompt(config: GraphConfig, question: str) -> str:
        history_components = []
        previous_message_type = None
        for message in prompt_builder.raw_message_history:
-            if "user" in message.message_type:
+            if message.message_type == MessageType.USER:
                history_components.append(f"User: {message.message}\n")
-                previous_message_type = "user"
+                previous_message_type = MessageType.USER
-            elif "assistant" in message.message_type:
+            elif message.message_type == MessageType.ASSISTANT:
-                # only use the last agent answer for the history
+                # Previously there could be multiple assistant messages in a row
-                if previous_message_type != "assistant":
+                # Now this is handled at the message history construction
-                    history_components.append(f"You/Agent: {message.message}\n")
+                assert previous_message_type is not MessageType.ASSISTANT
-                else:
+                history_components.append(f"You/Agent: {message.message}\n")
-                    history_components = history_components[:-1]
+                previous_message_type = MessageType.ASSISTANT
                    history_components.append(f"You/Agent: {message.message}\n")
                previous_message_type = "assistant"
            else:
                # Other message types are not included here; currently there should be no other message types
                logger.error(
                    f"Unhandled message type: {message.message_type} with message: {message.message}"
                )
                continue
        history = "\n".join(history_components)
        history = remove_document_citations(history)
        if len(history.split()) > AGENT_MAX_STATIC_HISTORY_WORD_LENGTH:
-            history = summarize_history(history, question, persona_base, model)
+            history = summarize_history(
                history=history,
                question=question,
                persona_specification=persona_base,
                llm=config.tooling.fast_llm,
            )
    return HISTORY_FRAMING_PROMPT.format(history=history) if history else ""
--- a/backend/onyx/agents/agent_search/shared_graph_utils/models.py
+++ b/backend/onyx/agents/agent_search/shared_graph_utils/models.py
@@ -119,7 +119,7 @@ class CombinedAgentMetrics(BaseModel):
 class PersonaPromptExpressions(BaseModel):
    contextualized_prompt: str
-    base_prompt: str
+    base_prompt: str | None
 class AgentPromptEnrichmentComponents(BaseModel):
--- a/backend/onyx/agents/agent_search/shared_graph_utils/utils.py
+++ b/backend/onyx/agents/agent_search/shared_graph_utils/utils.py
@@ -56,6 +56,7 @@ from onyx.prompts.agent_search import (
 from onyx.prompts.agent_search import (
    HISTORY_CONTEXT_SUMMARY_PROMPT,
 )
 from onyx.prompts.prompt_utils import handle_onyx_date_awareness
 from onyx.tools.force import ForceUseTool
 from onyx.tools.tool_constructor import SearchToolConfig
 from onyx.tools.tool_implementations.search.search_tool import (
@@ -227,16 +228,26 @@ def get_test_config(
 def get_persona_agent_prompt_expressions(
    persona: Persona | None,
 ) -> PersonaPromptExpressions:
-    if persona is None:
+    if persona is None or len(persona.prompts) == 0:
-        persona_base = ""
+        # TODO base_prompt should be None, but no time to properly fix
-        persona_prompt = ASSISTANT_SYSTEM_PROMPT_DEFAULT
+        return PersonaPromptExpressions(
-    else:
+            contextualized_prompt=ASSISTANT_SYSTEM_PROMPT_DEFAULT, base_prompt=""
        persona_base = "\n".join([x.system_prompt for x in persona.prompts])
        persona_prompt = ASSISTANT_SYSTEM_PROMPT_PERSONA.format(
            persona_prompt=persona_base
        )
    # Only a 1:1 mapping between personas and prompts currently
    prompt = persona.prompts[0]
    prompt_config = PromptConfig.from_model(prompt)
    datetime_aware_system_prompt = handle_onyx_date_awareness(
        prompt_str=prompt_config.system_prompt,
        prompt_config=prompt_config,
        add_additional_info_if_no_tag=prompt.datetime_aware,
    )
    return PersonaPromptExpressions(
-        contextualized_prompt=persona_prompt, base_prompt=persona_base
+        contextualized_prompt=ASSISTANT_SYSTEM_PROMPT_PERSONA.format(
            persona_prompt=datetime_aware_system_prompt
        ),
        base_prompt=datetime_aware_system_prompt,
    )
@@ -322,7 +333,7 @@ def get_answer_citation_ids(answer_str: str) -> list[int]:
 def summarize_history(
-    history: str, question: str, persona_specification: str, model: LLM
+    history: str, question: str, persona_specification: str | None, llm: LLM
 ) -> str:
    history_context_prompt = remove_document_citations(
        HISTORY_CONTEXT_SUMMARY_PROMPT.format(
@@ -332,7 +343,7 @@ def summarize_history(
        )
    )
-    history_response = model.invoke(history_context_prompt)
+    history_response = llm.invoke(history_context_prompt)
    assert isinstance(history_response.content, str)
    return history_response.content
--- a/backend/onyx/chat/chat_utils.py
+++ b/backend/onyx/chat/chat_utils.py
@@ -166,6 +166,7 @@ def create_chat_chain(
        )
    current_message: ChatMessage | None = root_message
    previous_message: ChatMessage | None = None
    while current_message is not None:
        child_msg = current_message.latest_child_message
@@ -183,7 +184,17 @@ def create_chat_chain(
                "could not find next message in the same session"
            )
-        mainline_messages.append(current_message)
+        if (
            current_message.message_type == MessageType.ASSISTANT
            and previous_message is not None
            and previous_message.message_type == MessageType.ASSISTANT
            and mainline_messages
        ):
            mainline_messages[-1] = current_message
        else:
            mainline_messages.append(current_message)
        previous_message = current_message
    if not mainline_messages:
        raise RuntimeError("Could not trace chat message history")
--- a/backend/onyx/prompts/agent_search.py
+++ b/backend/onyx/prompts/agent_search.py
@@ -2,7 +2,6 @@
 SEPARATOR_LINE = "-------"
 UNKNOWN_ANSWER = "I do not have enough information to answer this question."
 NO_RECOVERED_DOCS = "No relevant information recovered"
 DATE_PROMPT = "Today is {date}.\n\n"
 SUB_CHECK_YES = "yes"
 SUB_CHECK_NO = "no"
@@ -16,9 +15,7 @@ For more context, here is the history of the conversation so far that preceded t
 """.strip()
-ASSISTANT_SYSTEM_PROMPT_DEFAULT = (
+ASSISTANT_SYSTEM_PROMPT_DEFAULT = "You are an assistant for question-answering tasks."
    """You are an assistant for question-answering tasks."""
 )
 ASSISTANT_SYSTEM_PROMPT_PERSONA = f"""
 You are an assistant for question-answering tasks. Here is more information about you:
@@ -28,21 +25,25 @@ You are an assistant for question-answering tasks. Here is more information abou
 """.strip()
-SUB_QUESTION_ANSWER_TEMPLATE = """\n
+SUB_QUESTION_ANSWER_TEMPLATE = f"""
-Sub-Question: Q{sub_question_num}\n  Sub-Question:\n  - \n{sub_question}\n  --\nAnswer:\n  -\n {sub_answer}\n\n
+Sub-Question: Q{{sub_question_num}}
-"""
+Question:
 {{sub_question}}
 {SEPARATOR_LINE}
 Answer:
 {{sub_answer}}
 """.strip()
 SUB_QUESTION_ANSWER_TEMPLATE_REFINED = f"""
-Sub-Question: Q{{sub_question_num}}\n
+Sub-Question: Q{{sub_question_num}}
-Type:
+Type: {{sub_question_type}}
-{SEPARATOR_LINE}
+
 {{sub_question_type}}
 {SEPARATOR_LINE}
 Sub-Question:
 {SEPARATOR_LINE}
 {{sub_question}}
 {SEPARATOR_LINE}
 Answer:
 {SEPARATOR_LINE}
 {{sub_answer}}
@@ -73,30 +74,33 @@ And here is the context retrieved:
 {SEPARATOR_LINE}
 Please format your answer as a json object in the following format:
-{{
+""".strip()
-    "retrieved_entities_relationships": {{
+
 ENTITY_TERM_EXTRACTION_PROMPT_JSON_EXAMPLE = """
 {
    "retrieved_entities_relationships": {
        "entities": [
-            {{
+            {
                "entity_name": "<assign a name for the entity>",
                "entity_type": "<specify a short type name for the entity, such as 'company', 'location',...>"
-            }}
+            }
        ],
        "relationships": [
-            {{
+            {
                "relationship_name": "<assign a name for the relationship>",
                "relationship_type": "<specify a short type name for the relationship, such as 'sales_to', 'is_location_of',...>",
                "relationship_entities": ["<related entity name 1>", "<related entity name 2>", "..."]
-            }}
+            }
        ],
        "terms": [
-            {{
+            {
                "term_name": "<assign a name for the term>",
                "term_type": "<specify a short type name for the term, such as 'revenue', 'market_share',...>",
                "term_similar_to": ["<list terms that are similar to this term>"]
-            }}
+            }
        ]
-    }}
+    }
-}}
+}
 """.strip()
@@ -259,79 +263,63 @@ SUB_QUESTION_RAG_PROMPT = (
 SUB_ANSWER_CHECK_PROMPT = (
-    """\n
+    "Determine whether the given answer addresses the given question. "
-Your task is to see whether a given answer addresses a given question.
+    "Please do not use any internal knowledge you may have - just focus on whether the answer "
-Please do not use any internal knowledge you may have - just focus on whether the answer
+    "as given seems to largely address the question as given, or at least addresses part of the question.\n\n"
-as given seems to largely address the question as given, or at least addresses part of the question.
+    "Here is the question:\n"
-Here is the question:
+    f"{SEPARATOR_LINE}\n"
-\n-------\n
+    "{question}\n"
-{question}
+    f"{SEPARATOR_LINE}\n\n"
-\n-------\n
+    "Here is the suggested answer:\n"
-Here is the suggested answer:
+    f"{SEPARATOR_LINE}\n"
-\n-------\n
+    "{base_answer}\n"
-{base_answer}
+    f"{SEPARATOR_LINE}\n\n"
-\n-------\n
+    f'Does the suggested answer address the question? Please answer with "{SUB_CHECK_YES}" or "{SUB_CHECK_NO}".'
-Does the suggested answer address the question? Please answer with """
+).strip()
    + f'"{SUB_CHECK_YES}" or "{SUB_CHECK_NO}".'
 )
 # Initial Answer Generation
 INITIAL_ANSWER_PROMPT_W_SUB_QUESTIONS = (
-    """ \n
+    "{persona_specification}\n\n"
-{persona_specification}
+    "Use the information provided below - and only the provided information - to answer the provided main question.\n\n"
- {date_prompt}
+    "The information provided below consists of:\n"
-Use the information provided below - and only the provided information - to answer the provided main question.
+    "  1) a number of answered sub-questions - these are very important to help you organize your thoughts and your answer\n"
-
+    "  2) a number of documents that deemed relevant for the question.\n\n"
-The information provided below consists of:
+    "{history}\n\n"
-    1) a number of answered sub-questions - these are very important to help you organize your thoughts and your answer
+    "It is critical that you provide prover inline citations to documents in the format [[D1]](), [[D2]](), [[D3]](), etc.!\n"
-    2) a number of documents that deemed relevant for the question.
+    "It is important that the citation is close to the information it supports. If you have multiple citations that support\n"
-
+    "a fact, please cite for example as [[D1]]()[[D3]](), or [[D2]]()[[D4]](), etc.\n"
-{history}
+    "Feel free to also cite sub-questions in addition to documents, but make sure that you have documents cited with the "
-
+    "sub-question citation. If you want to cite both a document and a sub-question, please use [[D1]]()[[Q3]](), or "
-It is critical that you provide prover inline citations to documents in the format [[D1]](), [[D2]](), [[D3]](), etc.!
+    "[[D2]]()[[D7]]()[[Q4]](), etc.\n"
-It is important that the citation is close to the information it supports. If you have multiple citations that support
+    "Again, please NEVER cite sub-questions without a document citation! "
-a fact, please cite for example as [[D1]]()[[D3]](), or [[D2]]()[[D4]](), etc.
+    "Proper citations are very important for the user!\n\n"
-Feel free to also cite sub-questions in addition to documents, but make sure that you have documents cited with the sub-question
+    "IMPORTANT RULES:\n"
-citation. If you want to cite both a document and a sub-question, please use [[D1]]()[[Q3]](), or [[D2]]()[[D7]]()[[Q4]](), etc.
+    " - If you cannot reliably answer the question solely using the provided information, say that you cannot reliably answer.\n"
-Again, please NEVER cite sub-questions without a document citation!
+    " You may give some additional facts you learned, but do not try to invent an answer.\n"
-Proper citations are very important for the user!
+    f' - If the information is empty or irrelevant, just say "{UNKNOWN_ANSWER}".\n'
-
+    " - If the information is relevant but not fully conclusive, specify that the information is not conclusive and say why.\n\n"
-IMPORTANT RULES:
+    "Again, you should be sure that the answer is supported by the information provided!\n\n"
- - If you cannot reliably answer the question solely using the provided information, say that you cannot reliably answer.
+    "Try to keep your answer concise. But also highlight uncertainties you may have should there be substantial ones,\n"
- You may give some additional facts you learned, but do not try to invent an answer.
+    "or assumptions you made.\n\n"
- - If the information is empty or irrelevant, just say """
+    "Here is the contextual information:\n"
-    + f'"{UNKNOWN_ANSWER}"'
+    "---------------\n\n"
-    + """.
+    "*Answered Sub-questions (these should really matter!):\n"
- - If the information is relevant but not fully conclusive, specify that the information is not conclusive and say why.
+    f"{SEPARATOR_LINE}\n"
-
+    "{answered_sub_questions}\n"
-Again, you should be sure that the answer is supported by the information provided!
+    f"{SEPARATOR_LINE}\n\n"
-
+    "And here are relevant document information that support the sub-question answers, "
-Try to keep your answer concise. But also highlight uncertainties you may have should there be substantial ones,
+    "or that are relevant for the actual question:\n"
-or assumptions you made.
+    f"{SEPARATOR_LINE}\n"
-
+    "{relevant_docs}\n"
-Here is the contextual information:
+    f"{SEPARATOR_LINE}\n\n"
---------------
+    "And here is the question I want you to answer based on the information above:\n"
-
+    f"{SEPARATOR_LINE}\n"
-*Answered Sub-questions (these should really matter!):
+    "{question}\n"
-\n-------\n
+    f"{SEPARATOR_LINE}\n\n"
-{answered_sub_questions}
+    "Please keep your answer brief and concise, and focus on facts and data.\n\n"
-\n-------\n
+    "Answer:"
-
+).strip()
 And here are relevant document information that support the sub-question answers, or that are relevant for the actual question:\n
 \n-------\n
 {relevant_docs}
 \n-------\n
 And here is the question I want you to answer based on the information above:
 \n-------\n
 {question}
 \n-------\n\n
 Please keep your answer brief and concise, and focus on facts and data.
 Answer:"""
 )
 # used if sub_question_answer_str is empty
@@ -339,7 +327,6 @@ INITIAL_ANSWER_PROMPT_WO_SUB_QUESTIONS = (
    """\n
 {answered_sub_questions}
 {persona_specification}
 {date_prompt}
 Use the information provided below - and only the provided information - to answer the provided question.
 The information provided below consists of a number of documents that were deemed relevant for the question.
@@ -465,7 +452,7 @@ Generate the list of questions separated by one new line like this:
 REFINED_ANSWER_PROMPT_W_SUB_QUESTIONS = (
    """\n
 {persona_specification}
-{date_prompt}
+
 Your task is to improve on a given answer to a question, as the initial answer was found to be lacking in some way.
 Use the information provided below - and only the provided information - to write your new and improved answer.
@@ -542,7 +529,7 @@ REFINED_ANSWER_PROMPT_WO_SUB_QUESTIONS = (
    """\n
 {answered_sub_questions}\n
 {persona_specification}
-{date_prompt}
+
 Use the information provided below - and only the
 provided information - to answer the provided question.