Use Vespa Doc ID directly instead of from fields (#399)

2025-07-04 03:31:23 +02:00 · 2023-09-04 17:24:31 -07:00
parent f7cc7190fe
commit d593818996
1 changed file with 1 addition and 3 deletions
--- a/backend/danswer/datastores/vespa/store.py
+++ b/backend/danswer/datastores/vespa/store.py
@@ -104,9 +104,7 @@ def _get_vespa_chunk_ids_by_document_id(
    while True:
        results = requests.get(SEARCH_ENDPOINT, params=params).json()
        hits = results["root"].get("children", [])
-        doc_chunk_ids.extend(
+        doc_chunk_ids.extend([hit["id"].split("::")[1] for hit in hits])
-            [hit.get("fields", {}).get("documentid").split("::")[1] for hit in hits]
-        )
        params["offset"] += hits_per_page  # type: ignore
        if len(hits) < hits_per_page: