From 143b50c519d916c81e072d8ca406bf0d87750761 Mon Sep 17 00:00:00 2001 From: Vikas Neha Ojha Date: Thu, 2 May 2024 06:58:34 +0530 Subject: [PATCH] Save correct document url from document360 (#1413) --- backend/danswer/connectors/document360/connector.py | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/backend/danswer/connectors/document360/connector.py b/backend/danswer/connectors/document360/connector.py index c2fda5ac2..aab6d4dfa 100644 --- a/backend/danswer/connectors/document360/connector.py +++ b/backend/danswer/connectors/document360/connector.py @@ -28,7 +28,7 @@ from danswer.connectors.models import Section # 2. Only the HTML Articles are supported, Document360 also has a Markdown and "Block" format # 3. The contents are not as cleaned up as other HTML connectors -DOCUMENT360_BASE_URL = "https://preview.portal.document360.io/" +DOCUMENT360_BASE_URL = "https://portal.document360.io" DOCUMENT360_API_BASE_URL = "https://apihub.document360.io/v2" @@ -142,7 +142,11 @@ class Document360Connector(LoadConnector, PollConnector): if author["email_id"] ] - doc_link = f"{DOCUMENT360_BASE_URL}/{self.portal_id}/document/v1/view/{article['id']}" + doc_link = ( + article_details["url"] + if article_details.get("url") + else f"{DOCUMENT360_BASE_URL}/{self.portal_id}/document/v1/view/{article['id']}" + ) html_content = article_details["html_content"] article_content = (