fixed id retrieval from zip metadata (#1813)

This commit is contained in:
hagen-danswer 2024-07-11 20:38:12 -07:00 committed by GitHub
parent e50820e65e
commit 8c312482c1
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -85,6 +85,11 @@ def _process_file(
all_metadata = {**metadata, **file_metadata} if metadata else file_metadata
# add a prefix to avoid conflicts with other connectors
doc_id = f"FILE_CONNECTOR__{file_name}"
if metadata:
doc_id = metadata.get("id") or doc_id
# If this is set, we will show this in the UI as the "name" of the file
file_display_name = all_metadata.get("file_display_name") or os.path.basename(
file_name
@ -132,7 +137,7 @@ def _process_file(
return [
Document(
id=f"FILE_CONNECTOR__{file_name}", # add a prefix to avoid conflicts with other connectors
id=doc_id,
sections=[
Section(link=all_metadata.get("link"), text=file_content_raw.strip())
],