mirror of
https://github.com/danswer-ai/danswer.git
synced 2025-06-06 21:19:54 +02:00
153 lines
4.7 KiB
Python
153 lines
4.7 KiB
Python
from dataclasses import dataclass
|
|
|
|
from onyx.access.utils import prefix_external_group
|
|
from onyx.access.utils import prefix_user_email
|
|
from onyx.access.utils import prefix_user_group
|
|
from onyx.configs.constants import PUBLIC_DOC_PAT
|
|
|
|
|
|
@dataclass(frozen=True)
|
|
class ExternalAccess:
|
|
# Emails of external users with access to the doc externally
|
|
external_user_emails: set[str]
|
|
# Names or external IDs of groups with access to the doc
|
|
external_user_group_ids: set[str]
|
|
# Whether the document is public in the external system or Onyx
|
|
is_public: bool
|
|
|
|
def __str__(self) -> str:
|
|
"""Prevent extremely long logs"""
|
|
|
|
def truncate_set(s: set[str], max_len: int = 100) -> str:
|
|
s_str = str(s)
|
|
if len(s_str) > max_len:
|
|
return f"{s_str[:max_len]}... ({len(s)} items)"
|
|
return s_str
|
|
|
|
return (
|
|
f"ExternalAccess("
|
|
f"external_user_emails={truncate_set(self.external_user_emails)}, "
|
|
f"external_user_group_ids={truncate_set(self.external_user_group_ids)}, "
|
|
f"is_public={self.is_public})"
|
|
)
|
|
|
|
|
|
@dataclass(frozen=True)
|
|
class DocExternalAccess:
|
|
"""
|
|
This is just a class to wrap the external access and the document ID
|
|
together. It's used for syncing document permissions to Vespa.
|
|
"""
|
|
|
|
external_access: ExternalAccess
|
|
# The document ID
|
|
doc_id: str
|
|
|
|
def to_dict(self) -> dict:
|
|
return {
|
|
"external_access": {
|
|
"external_user_emails": list(self.external_access.external_user_emails),
|
|
"external_user_group_ids": list(
|
|
self.external_access.external_user_group_ids
|
|
),
|
|
"is_public": self.external_access.is_public,
|
|
},
|
|
"doc_id": self.doc_id,
|
|
}
|
|
|
|
@classmethod
|
|
def from_dict(cls, data: dict) -> "DocExternalAccess":
|
|
external_access = ExternalAccess(
|
|
external_user_emails=set(
|
|
data["external_access"].get("external_user_emails", [])
|
|
),
|
|
external_user_group_ids=set(
|
|
data["external_access"].get("external_user_group_ids", [])
|
|
),
|
|
is_public=data["external_access"]["is_public"],
|
|
)
|
|
return cls(
|
|
external_access=external_access,
|
|
doc_id=data["doc_id"],
|
|
)
|
|
|
|
|
|
@dataclass(frozen=True, init=False)
|
|
class DocumentAccess(ExternalAccess):
|
|
# User emails for Onyx users, None indicates admin
|
|
user_emails: set[str | None]
|
|
|
|
# Names of user groups associated with this document
|
|
user_groups: set[str]
|
|
|
|
external_user_emails: set[str]
|
|
external_user_group_ids: set[str]
|
|
is_public: bool
|
|
|
|
def __init__(self) -> None:
|
|
raise TypeError(
|
|
"Use `DocumentAccess.build(...)` instead of creating an instance directly."
|
|
)
|
|
|
|
def to_acl(self) -> set[str]:
|
|
# the acl's emitted by this function are prefixed by type
|
|
# to get the native objects, access the member variables directly
|
|
|
|
acl_set: set[str] = set()
|
|
for user_email in self.user_emails:
|
|
if user_email:
|
|
acl_set.add(prefix_user_email(user_email))
|
|
|
|
for group_name in self.user_groups:
|
|
acl_set.add(prefix_user_group(group_name))
|
|
|
|
for external_user_email in self.external_user_emails:
|
|
acl_set.add(prefix_user_email(external_user_email))
|
|
|
|
for external_group_id in self.external_user_group_ids:
|
|
acl_set.add(prefix_external_group(external_group_id))
|
|
|
|
if self.is_public:
|
|
acl_set.add(PUBLIC_DOC_PAT)
|
|
|
|
return acl_set
|
|
|
|
@classmethod
|
|
def build(
|
|
cls,
|
|
user_emails: list[str | None],
|
|
user_groups: list[str],
|
|
external_user_emails: list[str],
|
|
external_user_group_ids: list[str],
|
|
is_public: bool,
|
|
) -> "DocumentAccess":
|
|
"""Don't prefix incoming data wth acl type, prefix on read from to_acl!"""
|
|
|
|
obj = object.__new__(cls)
|
|
object.__setattr__(
|
|
obj, "user_emails", {user_email for user_email in user_emails if user_email}
|
|
)
|
|
object.__setattr__(obj, "user_groups", set(user_groups))
|
|
object.__setattr__(
|
|
obj,
|
|
"external_user_emails",
|
|
{external_email for external_email in external_user_emails},
|
|
)
|
|
object.__setattr__(
|
|
obj,
|
|
"external_user_group_ids",
|
|
{external_group_id for external_group_id in external_user_group_ids},
|
|
)
|
|
object.__setattr__(obj, "is_public", is_public)
|
|
|
|
return obj
|
|
|
|
|
|
default_public_access = DocumentAccess.build(
|
|
external_user_emails=[],
|
|
external_user_group_ids=[],
|
|
user_emails=[],
|
|
user_groups=[],
|
|
is_public=True,
|
|
)
|