From d5938189967fd6fb14e732cbc621859eae42e00e Mon Sep 17 00:00:00 2001 From: Yuhong Sun Date: Mon, 4 Sep 2023 17:24:31 -0700 Subject: [PATCH] Use Vespa Doc ID directly instead of from fields (#399) --- backend/danswer/datastores/vespa/store.py | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/backend/danswer/datastores/vespa/store.py b/backend/danswer/datastores/vespa/store.py index 16b21c4ca..5d4b3b0a9 100644 --- a/backend/danswer/datastores/vespa/store.py +++ b/backend/danswer/datastores/vespa/store.py @@ -104,9 +104,7 @@ def _get_vespa_chunk_ids_by_document_id( while True: results = requests.get(SEARCH_ENDPOINT, params=params).json() hits = results["root"].get("children", []) - doc_chunk_ids.extend( - [hit.get("fields", {}).get("documentid").split("::")[1] for hit in hits] - ) + doc_chunk_ids.extend([hit["id"].split("::")[1] for hit in hits]) params["offset"] += hits_per_page # type: ignore if len(hits) < hits_per_page: