Fix non-json model output processing (#332)

2025-09-25 11:16:43 +02:00 · 2023-08-24 19:43:58 -07:00
parent 6897416fe6
commit cb13f5b18b
1 changed file with 2 additions and 3 deletions
--- a/backend/danswer/direct_qa/qa_utils.py
+++ b/backend/danswer/direct_qa/qa_utils.py
@@ -211,8 +211,7 @@ def process_model_tokens(
        model_previous = model_output
        model_output += token
-        trimmed_combine = model_output.replace(" ", "").replace("\n", "")
+        if not found_answer_start and '{"answer":"' in re.sub(r"\s", "", model_output):
-        if not found_answer_start and '{"answer":"' in trimmed_combine:
            # Note, if the token that completes the pattern has additional text, for example if the token is "?
            # Then the chars after " will not be streamed, but this is ok as it prevents streaming the ? in the
            # event that the model outputs the UNCERTAINTY_PAT
@@ -232,7 +231,7 @@ def process_model_tokens(
                if hold_quote + token in quote_pat_full:
                    hold_quote += token
                    continue
-            yield DanswerAnswerPiece(answer_piece=token)
+            yield DanswerAnswerPiece(answer_piece=hold_quote + token)
            hold_quote = ""
    logger.debug(f"Raw model output: {model_output}")