From 0c58c8d6cb8e00f504505953ad880714348611d6 Mon Sep 17 00:00:00 2001
From: Chris Weaver <25087905+Weves@users.noreply.github.com>
Date: Tue, 26 Sep 2023 12:53:19 -0700
Subject: [PATCH] Adding Document Sets (#477)
Adds:
- name for connector credential pairs + frontend changes to start populating this field
- document set table migration
- during indexing, each document's document set memberships are now looked up and written into Vespa
- background job to check if document sets need to be synced
- document set management APIs
- document set management dashboard in the UI
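
As a rough illustration (not part of this change itself), the new management endpoints can be exercised as below. The routes and request bodies come from `backend/danswer/server/document_set.py` and the new Pydantic models; the base URL, the pre-authenticated admin session, and the example names/IDs are assumptions for the sketch only.

```python
import requests

BASE_URL = "http://localhost:8080"  # assumed local API server address
session = requests.Session()  # assumed to already carry an admin user's auth cookie

# create a document set from two existing connector-credential pairs
doc_set_id = session.post(
    f"{BASE_URL}/manage/admin/document-set",
    json={
        "name": "Engineering Docs",            # example name
        "description": "Confluence + GitHub",  # example description
        "cc_pair_ids": [1, 2],                 # example connector-credential pair IDs
    },
).json()

# change the description / attached cc-pairs; this marks the set as not up to date
session.patch(
    f"{BASE_URL}/manage/admin/document-set",
    json={"id": doc_set_id, "description": "Engineering Docs v2", "cc_pair_ids": [1]},
)

# list document sets (also available to non-admin users)
print(session.get(f"{BASE_URL}/manage/document-set").json())

# delete the document set
session.delete(f"{BASE_URL}/manage/admin/document-set/{doc_set_id}")
```

After the PATCH, the new `document_set_sync` background job notices `is_up_to_date == False` and re-syncs the affected documents in Vespa.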
---
.../57b53544726e_add_document_set_tables.py | 59 ++++
...24ae9_add_id_to_connectorcredentialpair.py | 60 ++++
backend/danswer/background/celery.py | 88 ------
backend/danswer/background/celery/celery.py | 29 ++
.../danswer/background/celery/celery_utils.py | 37 +++
.../background/celery/deletion_utils.py | 41 +++
.../background/document_set_sync_script.py | 53 ++++
backend/danswer/background/utils.py | 7 +-
.../danswer/datastores/indexing_pipeline.py | 11 +-
.../danswer/db/connector_credential_pair.py | 2 +
backend/danswer/db/document_set.py | 282 ++++++++++++++++++
backend/danswer/db/models.py | 56 ++++
backend/danswer/document_set/document_set.py | 65 ++++
backend/danswer/main.py | 2 +
backend/danswer/server/document_set.py | 101 +++++++
backend/danswer/server/manage.py | 27 +-
backend/danswer/server/models.py | 33 ++
backend/supervisord.conf | 9 +-
.../app/admin/connectors/bookstack/page.tsx | 19 +-
.../app/admin/connectors/confluence/page.tsx | 32 +-
web/src/app/admin/connectors/file/page.tsx | 98 +++---
web/src/app/admin/connectors/github/page.tsx | 16 +-
.../admin/connectors/google-drive/page.tsx | 7 +-
web/src/app/admin/connectors/guru/page.tsx | 13 +-
web/src/app/admin/connectors/jira/page.tsx | 22 +-
web/src/app/admin/connectors/linear/page.tsx | 14 +-
web/src/app/admin/connectors/notion/page.tsx | 16 +-
.../admin/connectors/productboard/page.tsx | 20 +-
web/src/app/admin/connectors/slab/page.tsx | 16 +-
web/src/app/admin/connectors/slack/page.tsx | 105 +++----
web/src/app/admin/connectors/web/page.tsx | 9 +-
web/src/app/admin/connectors/zulip/page.tsx | 10 +-
.../sets/DocumentSetCreationForm.tsx | 179 +++++++++++
web/src/app/admin/documents/sets/hooks.tsx | 13 +
web/src/app/admin/documents/sets/lib.ts | 56 ++++
web/src/app/admin/documents/sets/page.tsx | 268 +++++++++++++++++
web/src/app/admin/indexing/status/page.tsx | 111 +------
web/src/app/admin/layout.tsx | 10 +
web/src/components/Loading.tsx | 20 ++
.../admin/connectors/ConnectorForm.tsx | 105 +++++--
.../admin/connectors/ConnectorTitle.tsx | 109 +++++++
web/src/components/admin/connectors/Field.tsx | 24 +-
.../table/SingleUseConnectorsTable.tsx | 5 +
web/src/components/icons/icons.tsx | 8 +
web/src/lib/credential.ts | 9 +-
web/src/lib/hooks.ts | 24 +-
web/src/lib/types.ts | 18 ++
47 files changed, 1887 insertions(+), 431 deletions(-)
create mode 100644 backend/alembic/versions/57b53544726e_add_document_set_tables.py
create mode 100644 backend/alembic/versions/800f48024ae9_add_id_to_connectorcredentialpair.py
delete mode 100644 backend/danswer/background/celery.py
create mode 100644 backend/danswer/background/celery/celery.py
create mode 100644 backend/danswer/background/celery/celery_utils.py
create mode 100644 backend/danswer/background/celery/deletion_utils.py
create mode 100644 backend/danswer/background/document_set_sync_script.py
create mode 100644 backend/danswer/db/document_set.py
create mode 100644 backend/danswer/document_set/document_set.py
create mode 100644 backend/danswer/server/document_set.py
create mode 100644 web/src/app/admin/documents/sets/DocumentSetCreationForm.tsx
create mode 100644 web/src/app/admin/documents/sets/hooks.tsx
create mode 100644 web/src/app/admin/documents/sets/lib.ts
create mode 100644 web/src/app/admin/documents/sets/page.tsx
create mode 100644 web/src/components/admin/connectors/ConnectorTitle.tsx
diff --git a/backend/alembic/versions/57b53544726e_add_document_set_tables.py b/backend/alembic/versions/57b53544726e_add_document_set_tables.py
new file mode 100644
index 000000000..719f43f23
--- /dev/null
+++ b/backend/alembic/versions/57b53544726e_add_document_set_tables.py
@@ -0,0 +1,59 @@
+"""Add document set tables
+
+Revision ID: 57b53544726e
+Revises: 800f48024ae9
+Create Date: 2023-09-20 16:59:39.097177
+
+"""
+from alembic import op
+import fastapi_users_db_sqlalchemy
+import sqlalchemy as sa
+
+# revision identifiers, used by Alembic.
+revision = "57b53544726e"
+down_revision = "800f48024ae9"
+branch_labels = None
+depends_on = None
+
+
+def upgrade() -> None:
+ op.create_table(
+ "document_set",
+ sa.Column("id", sa.Integer(), nullable=False),
+ sa.Column("name", sa.String(), nullable=False),
+ sa.Column("description", sa.String(), nullable=False),
+ sa.Column(
+ "user_id",
+ fastapi_users_db_sqlalchemy.generics.GUID(),
+ nullable=True,
+ ),
+ sa.Column("is_up_to_date", sa.Boolean(), nullable=False),
+ sa.ForeignKeyConstraint(
+ ["user_id"],
+ ["user.id"],
+ ),
+ sa.PrimaryKeyConstraint("id"),
+ sa.UniqueConstraint("name"),
+ )
+ op.create_table(
+ "document_set__connector_credential_pair",
+ sa.Column("document_set_id", sa.Integer(), nullable=False),
+ sa.Column("connector_credential_pair_id", sa.Integer(), nullable=False),
+ sa.Column("is_current", sa.Boolean(), nullable=False),
+ sa.ForeignKeyConstraint(
+ ["connector_credential_pair_id"],
+ ["connector_credential_pair.id"],
+ ),
+ sa.ForeignKeyConstraint(
+ ["document_set_id"],
+ ["document_set.id"],
+ ),
+ sa.PrimaryKeyConstraint(
+ "document_set_id", "connector_credential_pair_id", "is_current"
+ ),
+ )
+
+
+def downgrade() -> None:
+ op.drop_table("document_set__connector_credential_pair")
+ op.drop_table("document_set")
diff --git a/backend/alembic/versions/800f48024ae9_add_id_to_connectorcredentialpair.py b/backend/alembic/versions/800f48024ae9_add_id_to_connectorcredentialpair.py
new file mode 100644
index 000000000..3074a8af0
--- /dev/null
+++ b/backend/alembic/versions/800f48024ae9_add_id_to_connectorcredentialpair.py
@@ -0,0 +1,60 @@
+"""Add ID to ConnectorCredentialPair
+
+Revision ID: 800f48024ae9
+Revises: 767f1c2a00eb
+Create Date: 2023-09-19 16:13:42.299715
+
+"""
+from alembic import op
+import sqlalchemy as sa
+from sqlalchemy.schema import Sequence, CreateSequence
+
+# revision identifiers, used by Alembic.
+revision = "800f48024ae9"
+down_revision = "767f1c2a00eb"
+branch_labels = None
+depends_on = None
+
+
+def upgrade() -> None:
+ sequence = Sequence("connector_credential_pair_id_seq")
+ op.execute(CreateSequence(sequence)) # type: ignore
+ op.add_column(
+ "connector_credential_pair",
+ sa.Column(
+ "id", sa.Integer(), nullable=True, server_default=sequence.next_value()
+ ),
+ )
+ op.add_column(
+ "connector_credential_pair",
+ sa.Column("name", sa.String(), nullable=True),
+ )
+
+ # fill in IDs for existing rows
+ op.execute(
+ "UPDATE connector_credential_pair SET id = nextval('connector_credential_pair_id_seq') WHERE id IS NULL"
+ )
+ op.alter_column("connector_credential_pair", "id", nullable=False)
+
+ op.create_unique_constraint(
+ "connector_credential_pair__name__key", "connector_credential_pair", ["name"]
+ )
+ op.create_unique_constraint(
+ "connector_credential_pair__id__key", "connector_credential_pair", ["id"]
+ )
+
+
+def downgrade() -> None:
+ op.drop_constraint(
+ "connector_credential_pair__name__key",
+ "connector_credential_pair",
+ type_="unique",
+ )
+ op.drop_constraint(
+ "connector_credential_pair__id__key",
+ "connector_credential_pair",
+ type_="unique",
+ )
+ op.drop_column("connector_credential_pair", "name")
+ op.drop_column("connector_credential_pair", "id")
+ op.execute("DROP SEQUENCE connector_credential_pair_id_seq")
diff --git a/backend/danswer/background/celery.py b/backend/danswer/background/celery.py
deleted file mode 100644
index 2325adcb9..000000000
--- a/backend/danswer/background/celery.py
+++ /dev/null
@@ -1,88 +0,0 @@
-import json
-from typing import cast
-
-from celery import Celery
-from celery.result import AsyncResult
-from sqlalchemy import text
-from sqlalchemy.orm import Session
-
-from danswer.background.connector_deletion import cleanup_connector_credential_pair
-from danswer.background.connector_deletion import get_cleanup_task_id
-from danswer.db.engine import build_connection_string
-from danswer.db.engine import get_sqlalchemy_engine
-from danswer.db.engine import SYNC_DB_API
-from danswer.db.models import DeletionStatus
-from danswer.server.models import DeletionAttemptSnapshot
-
-celery_broker_url = "sqla+" + build_connection_string(db_api=SYNC_DB_API)
-celery_backend_url = "db+" + build_connection_string(db_api=SYNC_DB_API)
-celery_app = Celery(__name__, broker=celery_broker_url, backend=celery_backend_url)
-
-
-@celery_app.task(soft_time_limit=60 * 60 * 6) # 6 hour time limit
-def cleanup_connector_credential_pair_task(
- connector_id: int, credential_id: int
-) -> int:
- return cleanup_connector_credential_pair(connector_id, credential_id)
-
-
-def get_deletion_status(
- connector_id: int, credential_id: int
-) -> DeletionAttemptSnapshot | None:
- cleanup_task_id = get_cleanup_task_id(
- connector_id=connector_id, credential_id=credential_id
- )
- deletion_task = get_celery_task(task_id=cleanup_task_id)
- deletion_task_status = get_celery_task_status(task_id=cleanup_task_id)
-
- deletion_status = None
- error_msg = None
- num_docs_deleted = 0
- if deletion_task_status == "SUCCESS":
- deletion_status = DeletionStatus.SUCCESS
- num_docs_deleted = cast(int, deletion_task.get(propagate=False))
- elif deletion_task_status == "FAILURE":
- deletion_status = DeletionStatus.FAILED
- error_msg = deletion_task.get(propagate=False)
- elif deletion_task_status == "STARTED" or deletion_task_status == "PENDING":
- deletion_status = DeletionStatus.IN_PROGRESS
-
- return (
- DeletionAttemptSnapshot(
- connector_id=connector_id,
- credential_id=credential_id,
- status=deletion_status,
- error_msg=str(error_msg),
- num_docs_deleted=num_docs_deleted,
- )
- if deletion_status
- else None
- )
-
-
-def get_celery_task(task_id: str) -> AsyncResult:
- """NOTE: even if the task doesn't exist, celery will still return something
- with a `PENDING` state"""
- return AsyncResult(task_id, backend=celery_app.backend)
-
-
-def get_celery_task_status(task_id: str) -> str | None:
- """NOTE: is tightly coupled to the internals of kombu (which is the
- translation layer to allow us to use Postgres as a broker). If we change
- the broker, this will need to be updated.
-
- This should not be called on any critical flows.
- """
- task = get_celery_task(task_id)
- # if not pending, then we know the task really exists
- if task.status != "PENDING":
- return task.status
-
- with Session(get_sqlalchemy_engine()) as session:
- rows = session.execute(text("SELECT payload FROM kombu_message WHERE visible"))
- for row in rows:
- payload = json.loads(row[0])
- if payload["headers"]["id"] == task_id:
- return "PENDING"
-
- return None
diff --git a/backend/danswer/background/celery/celery.py b/backend/danswer/background/celery/celery.py
new file mode 100644
index 000000000..47de830b1
--- /dev/null
+++ b/backend/danswer/background/celery/celery.py
@@ -0,0 +1,29 @@
+from celery import Celery
+
+from danswer.background.connector_deletion import cleanup_connector_credential_pair
+from danswer.db.engine import build_connection_string
+from danswer.db.engine import SYNC_DB_API
+from danswer.document_set.document_set import sync_document_set
+from danswer.utils.logger import setup_logger
+
+logger = setup_logger()
+
+celery_broker_url = "sqla+" + build_connection_string(db_api=SYNC_DB_API)
+celery_backend_url = "db+" + build_connection_string(db_api=SYNC_DB_API)
+celery_app = Celery(__name__, broker=celery_broker_url, backend=celery_backend_url)
+
+
+@celery_app.task(soft_time_limit=60 * 60 * 6) # 6 hour time limit
+def cleanup_connector_credential_pair_task(
+ connector_id: int, credential_id: int
+) -> int:
+ return cleanup_connector_credential_pair(connector_id, credential_id)
+
+
+@celery_app.task(soft_time_limit=60 * 60 * 6) # 6 hour time limit
+def sync_document_set_task(document_set_id: int) -> None:
+ try:
+ return sync_document_set(document_set_id=document_set_id)
+ except Exception:
+ logger.exception("Failed to sync document set %s", document_set_id)
+ raise
diff --git a/backend/danswer/background/celery/celery_utils.py b/backend/danswer/background/celery/celery_utils.py
new file mode 100644
index 000000000..c58624065
--- /dev/null
+++ b/backend/danswer/background/celery/celery_utils.py
@@ -0,0 +1,37 @@
+import json
+
+from celery.result import AsyncResult
+from sqlalchemy import text
+from sqlalchemy.orm import Session
+
+from danswer.background.celery.celery import celery_app
+from danswer.db.engine import get_sqlalchemy_engine
+
+
+def get_celery_task(task_id: str) -> AsyncResult:
+ """NOTE: even if the task doesn't exist, celery will still return something
+ with a `PENDING` state"""
+ return AsyncResult(task_id, backend=celery_app.backend)
+
+
+def get_celery_task_status(task_id: str) -> str | None:
+    """NOTE: this is tightly coupled to the internals of kombu (the translation
+    layer that allows us to use Postgres as a broker). If we change the broker,
+    this will need to be updated.
+
+ This should not be called on any critical flows.
+ """
+ # first check for any pending tasks
+ with Session(get_sqlalchemy_engine()) as session:
+ rows = session.execute(text("SELECT payload FROM kombu_message WHERE visible"))
+ for row in rows:
+ payload = json.loads(row[0])
+ if payload["headers"]["id"] == task_id:
+ return "PENDING"
+
+ task = get_celery_task(task_id)
+ # if not pending, then we know the task really exists
+ if task.status != "PENDING":
+ return task.status
+
+ return None
diff --git a/backend/danswer/background/celery/deletion_utils.py b/backend/danswer/background/celery/deletion_utils.py
new file mode 100644
index 000000000..c6d056022
--- /dev/null
+++ b/backend/danswer/background/celery/deletion_utils.py
@@ -0,0 +1,41 @@
+from typing import cast
+
+from danswer.background.celery.celery_utils import get_celery_task
+from danswer.background.celery.celery_utils import get_celery_task_status
+from danswer.background.connector_deletion import get_cleanup_task_id
+from danswer.db.models import DeletionStatus
+from danswer.server.models import DeletionAttemptSnapshot
+
+
+def get_deletion_status(
+ connector_id: int, credential_id: int
+) -> DeletionAttemptSnapshot | None:
+ cleanup_task_id = get_cleanup_task_id(
+ connector_id=connector_id, credential_id=credential_id
+ )
+ deletion_task = get_celery_task(task_id=cleanup_task_id)
+ deletion_task_status = get_celery_task_status(task_id=cleanup_task_id)
+
+ deletion_status = None
+ error_msg = None
+ num_docs_deleted = 0
+ if deletion_task_status == "SUCCESS":
+ deletion_status = DeletionStatus.SUCCESS
+ num_docs_deleted = cast(int, deletion_task.get(propagate=False))
+ elif deletion_task_status == "FAILURE":
+ deletion_status = DeletionStatus.FAILED
+ error_msg = deletion_task.get(propagate=False)
+ elif deletion_task_status == "STARTED" or deletion_task_status == "PENDING":
+ deletion_status = DeletionStatus.IN_PROGRESS
+
+ return (
+ DeletionAttemptSnapshot(
+ connector_id=connector_id,
+ credential_id=credential_id,
+ status=deletion_status,
+ error_msg=str(error_msg),
+ num_docs_deleted=num_docs_deleted,
+ )
+ if deletion_status
+ else None
+ )
diff --git a/backend/danswer/background/document_set_sync_script.py b/backend/danswer/background/document_set_sync_script.py
new file mode 100644
index 000000000..37ce3be05
--- /dev/null
+++ b/backend/danswer/background/document_set_sync_script.py
@@ -0,0 +1,53 @@
+from celery.result import AsyncResult
+from sqlalchemy.orm import Session
+
+from danswer.background.celery.celery import sync_document_set_task
+from danswer.background.utils import interval_run_job
+from danswer.db.document_set import (
+ fetch_document_sets,
+)
+from danswer.db.engine import get_sqlalchemy_engine
+from danswer.utils.logger import setup_logger
+
+logger = setup_logger()
+
+
+_ExistingTaskCache: dict[int, AsyncResult] = {}
+
+
+def _document_sync_loop() -> None:
+ # cleanup tasks
+ existing_tasks = list(_ExistingTaskCache.items())
+ for document_set_id, task in existing_tasks:
+ if task.ready():
+ logger.info(
+                f"Document set sync for '{document_set_id}' is complete with status "
+ f"{task.status}. Cleaning up."
+ )
+ del _ExistingTaskCache[document_set_id]
+
+ # kick off new tasks
+ with Session(get_sqlalchemy_engine()) as db_session:
+ # check if any document sets are not synced
+ document_set_info = fetch_document_sets(db_session=db_session)
+ for document_set, _ in document_set_info:
+ if not document_set.is_up_to_date:
+ if document_set.id in _ExistingTaskCache:
+ logger.info(
+ f"Document set '{document_set.id}' is already syncing. Skipping."
+ )
+ continue
+
+ logger.info(
+ f"Document set {document_set.id} is not synced. Syncing now!"
+ )
+ task = sync_document_set_task.apply_async(
+ kwargs=dict(document_set_id=document_set.id),
+ )
+ _ExistingTaskCache[document_set.id] = task
+
+
+if __name__ == "__main__":
+ interval_run_job(
+ job=_document_sync_loop, delay=5, emit_job_start_log=False
+ ) # run every 5 seconds
diff --git a/backend/danswer/background/utils.py b/backend/danswer/background/utils.py
index 8103d82ce..b822e9571 100644
--- a/backend/danswer/background/utils.py
+++ b/backend/danswer/background/utils.py
@@ -8,10 +8,13 @@ from danswer.utils.logger import setup_logger
logger = setup_logger()
-def interval_run_job(job: Callable[[], Any], delay: int | float) -> None:
+def interval_run_job(
+ job: Callable[[], Any], delay: int | float, emit_job_start_log: bool = True
+) -> None:
while True:
start = time.time()
- logger.info(f"Running '{job.__name__}', current time: {time.ctime(start)}")
+ if emit_job_start_log:
+ logger.info(f"Running '{job.__name__}', current time: {time.ctime(start)}")
try:
job()
except Exception as e:
diff --git a/backend/danswer/datastores/indexing_pipeline.py b/backend/danswer/datastores/indexing_pipeline.py
index c6b0cfbdd..ea395f368 100644
--- a/backend/danswer/datastores/indexing_pipeline.py
+++ b/backend/danswer/datastores/indexing_pipeline.py
@@ -16,6 +16,7 @@ from danswer.datastores.interfaces import DocumentIndex
from danswer.datastores.interfaces import DocumentMetadata
from danswer.db.document import prepare_to_modify_documents
from danswer.db.document import upsert_documents_complete
+from danswer.db.document_set import fetch_document_sets_for_documents
from danswer.db.engine import get_sqlalchemy_engine
from danswer.search.models import Embedder
from danswer.search.semantic_search import DefaultEmbedder
@@ -99,11 +100,19 @@ def _indexing_pipeline(
document_id_to_access_info = get_access_for_documents(
document_ids=document_ids, db_session=db_session
)
+ document_id_to_document_set = {
+ document_id: document_sets
+ for document_id, document_sets in fetch_document_sets_for_documents(
+ document_ids=document_ids, db_session=db_session
+ )
+ }
access_aware_chunks = [
DocMetadataAwareIndexChunk.from_index_chunk(
index_chunk=chunk,
access=document_id_to_access_info[chunk.source_document.id],
- document_sets=set(),
+ document_sets=set(
+ document_id_to_document_set.get(chunk.source_document.id, [])
+ ),
)
for chunk in chunks_with_embeddings
]
diff --git a/backend/danswer/db/connector_credential_pair.py b/backend/danswer/db/connector_credential_pair.py
index ac6d5dcc0..2b1767f1e 100644
--- a/backend/danswer/db/connector_credential_pair.py
+++ b/backend/danswer/db/connector_credential_pair.py
@@ -110,6 +110,7 @@ def mark_all_in_progress_cc_pairs_failed(
def add_credential_to_connector(
connector_id: int,
credential_id: int,
+ cc_pair_name: str | None,
user: User,
db_session: Session,
) -> StatusResponse[int]:
@@ -143,6 +144,7 @@ def add_credential_to_connector(
association = ConnectorCredentialPair(
connector_id=connector_id,
credential_id=credential_id,
+ name=cc_pair_name,
)
db_session.add(association)
db_session.commit()
diff --git a/backend/danswer/db/document_set.py b/backend/danswer/db/document_set.py
new file mode 100644
index 000000000..aacc2243d
--- /dev/null
+++ b/backend/danswer/db/document_set.py
@@ -0,0 +1,282 @@
+from collections.abc import Sequence
+from typing import cast
+from uuid import UUID
+
+from sqlalchemy import and_
+from sqlalchemy import delete
+from sqlalchemy import func
+from sqlalchemy import select
+from sqlalchemy.orm import Session
+
+from danswer.db.models import ConnectorCredentialPair
+from danswer.db.models import Document
+from danswer.db.models import DocumentByConnectorCredentialPair
+from danswer.db.models import DocumentSet as DocumentSetDBModel
+from danswer.db.models import DocumentSet__ConnectorCredentialPair
+from danswer.server.models import DocumentSetCreationRequest
+from danswer.server.models import DocumentSetUpdateRequest
+
+
+def _delete_document_set_cc_pairs(
+ db_session: Session, document_set_id: int, is_current: bool | None = None
+) -> None:
+ """NOTE: does not commit transaction, this must be done by the caller"""
+ stmt = delete(DocumentSet__ConnectorCredentialPair).where(
+ DocumentSet__ConnectorCredentialPair.document_set_id == document_set_id
+ )
+ if is_current is not None:
+ stmt = stmt.where(DocumentSet__ConnectorCredentialPair.is_current == is_current)
+ db_session.execute(stmt)
+
+
+def _mark_document_set_cc_pairs_as_outdated(
+ db_session: Session, document_set_id: int
+) -> None:
+ """NOTE: does not commit transaction, this must be done by the caller"""
+ stmt = select(DocumentSet__ConnectorCredentialPair).where(
+ DocumentSet__ConnectorCredentialPair.document_set_id == document_set_id
+ )
+ for row in db_session.scalars(stmt):
+ row.is_current = False
+
+
+def get_document_set_by_id(
+ db_session: Session, document_set_id: int
+) -> DocumentSetDBModel | None:
+ return db_session.scalar(
+ select(DocumentSetDBModel).where(DocumentSetDBModel.id == document_set_id)
+ )
+
+
+def insert_document_set(
+ document_set_creation_request: DocumentSetCreationRequest,
+ user_id: UUID | None,
+ db_session: Session,
+) -> tuple[DocumentSetDBModel, list[DocumentSet__ConnectorCredentialPair]]:
+ if not document_set_creation_request.cc_pair_ids:
+ raise ValueError("Cannot create a document set with no CC pairs")
+
+ # start a transaction
+ db_session.begin()
+
+ try:
+ new_document_set_row = DocumentSetDBModel(
+ name=document_set_creation_request.name,
+ description=document_set_creation_request.description,
+ user_id=user_id,
+ )
+ db_session.add(new_document_set_row)
+ db_session.flush() # ensure the new document set gets assigned an ID
+
+ ds_cc_pairs = [
+ DocumentSet__ConnectorCredentialPair(
+ document_set_id=new_document_set_row.id,
+ connector_credential_pair_id=cc_pair_id,
+ is_current=True,
+ )
+ for cc_pair_id in document_set_creation_request.cc_pair_ids
+ ]
+ db_session.add_all(ds_cc_pairs)
+ db_session.commit()
+ except:
+ db_session.rollback()
+ raise
+
+ return new_document_set_row, ds_cc_pairs
+
+
+def update_document_set(
+ document_set_update_request: DocumentSetUpdateRequest, db_session: Session
+) -> tuple[DocumentSetDBModel, list[DocumentSet__ConnectorCredentialPair]]:
+ if not document_set_update_request.cc_pair_ids:
+        raise ValueError("Cannot update a document set to have no CC pairs")
+
+ # start a transaction
+ db_session.begin()
+
+ try:
+ # update the description
+ document_set_row = get_document_set_by_id(
+ db_session=db_session, document_set_id=document_set_update_request.id
+ )
+ if document_set_row is None:
+ raise ValueError(
+ f"No document set with ID {document_set_update_request.id}"
+ )
+ document_set_row.description = document_set_update_request.description
+ document_set_row.is_up_to_date = False
+
+ # update the attached CC pairs
+ # first, mark all existing CC pairs as not current
+ _mark_document_set_cc_pairs_as_outdated(
+ db_session=db_session, document_set_id=document_set_row.id
+ )
+ # add in rows for the new CC pairs
+ ds_cc_pairs = [
+ DocumentSet__ConnectorCredentialPair(
+ document_set_id=document_set_update_request.id,
+ connector_credential_pair_id=cc_pair_id,
+ is_current=True,
+ )
+ for cc_pair_id in document_set_update_request.cc_pair_ids
+ ]
+ db_session.add_all(ds_cc_pairs)
+ db_session.commit()
+ except:
+ db_session.rollback()
+ raise
+
+ return document_set_row, ds_cc_pairs
+
+
+def mark_document_set_as_synced(document_set_id: int, db_session: Session) -> None:
+ stmt = select(DocumentSetDBModel).where(DocumentSetDBModel.id == document_set_id)
+ document_set = db_session.scalar(stmt)
+ if document_set is None:
+ raise ValueError(f"No document set with ID: {document_set_id}")
+
+ # mark as up to date
+ document_set.is_up_to_date = True
+ # delete outdated relationship table rows
+ _delete_document_set_cc_pairs(
+ db_session=db_session, document_set_id=document_set_id, is_current=False
+ )
+ db_session.commit()
+
+
+def delete_document_set(document_set_id: int, db_session: Session) -> None:
+ # start a transaction
+ db_session.begin()
+
+ try:
+ document_set_row = get_document_set_by_id(
+ db_session=db_session, document_set_id=document_set_id
+ )
+ if document_set_row is None:
+ raise ValueError(f"No document set with ID: '{document_set_id}'")
+
+ # delete all relationships to CC pairs
+ _delete_document_set_cc_pairs(
+ db_session=db_session, document_set_id=document_set_id
+ )
+ # delete the actual document set row
+ db_session.delete(document_set_row)
+ db_session.commit()
+ except:
+ db_session.rollback()
+ raise
+
+
+def fetch_document_sets(
+ db_session: Session,
+) -> list[tuple[DocumentSetDBModel, list[ConnectorCredentialPair]]]:
+    """Returns a list where each element is a tuple of:
+ 1. The document set itself
+ 2. All CC pairs associated with the document set"""
+ results = cast(
+ list[tuple[DocumentSetDBModel, ConnectorCredentialPair]],
+ db_session.execute(
+ select(DocumentSetDBModel, ConnectorCredentialPair)
+ .join(
+ DocumentSet__ConnectorCredentialPair,
+ DocumentSetDBModel.id
+ == DocumentSet__ConnectorCredentialPair.document_set_id,
+ )
+ .join(
+ ConnectorCredentialPair,
+ ConnectorCredentialPair.id
+ == DocumentSet__ConnectorCredentialPair.connector_credential_pair_id,
+ )
+ .where(
+ DocumentSet__ConnectorCredentialPair.is_current == True # noqa: E712
+ )
+ ).all(),
+ )
+
+ aggregated_results: dict[
+ int, tuple[DocumentSetDBModel, list[ConnectorCredentialPair]]
+ ] = {}
+ for document_set, cc_pair in results:
+ if document_set.id not in aggregated_results:
+ aggregated_results[document_set.id] = (document_set, [cc_pair])
+ else:
+ aggregated_results[document_set.id][1].append(cc_pair)
+
+ return [
+ (document_set, cc_pairs)
+ for document_set, cc_pairs in aggregated_results.values()
+ ]
+
+
+def fetch_documents_for_document_set(
+ document_set_id: int, db_session: Session, current_only: bool = True
+) -> Sequence[Document]:
+ stmt = (
+ select(Document)
+ .join(
+ DocumentByConnectorCredentialPair,
+ DocumentByConnectorCredentialPair.id == Document.id,
+ )
+ .join(
+ ConnectorCredentialPair,
+ and_(
+ ConnectorCredentialPair.connector_id
+ == DocumentByConnectorCredentialPair.connector_id,
+ ConnectorCredentialPair.credential_id
+ == DocumentByConnectorCredentialPair.credential_id,
+ ),
+ )
+ .join(
+ DocumentSet__ConnectorCredentialPair,
+ DocumentSet__ConnectorCredentialPair.connector_credential_pair_id
+ == ConnectorCredentialPair.id,
+ )
+ .join(
+ DocumentSetDBModel,
+ DocumentSetDBModel.id
+ == DocumentSet__ConnectorCredentialPair.document_set_id,
+ )
+ .where(DocumentSetDBModel.id == document_set_id)
+ )
+ if current_only:
+ stmt = stmt.where(
+ DocumentSet__ConnectorCredentialPair.is_current == True # noqa: E712
+ )
+ stmt = stmt.distinct()
+
+ return db_session.scalars(stmt).all()
+
+
+def fetch_document_sets_for_documents(
+ document_ids: list[str], db_session: Session
+) -> Sequence[tuple[str, list[str]]]:
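+    """Gives back a list of (document_id, all document set names for that document) tuples."""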
+ stmt = (
+ select(Document.id, func.array_agg(DocumentSetDBModel.name))
+ .join(
+ DocumentSet__ConnectorCredentialPair,
+ DocumentSetDBModel.id
+ == DocumentSet__ConnectorCredentialPair.document_set_id,
+ )
+ .join(
+ ConnectorCredentialPair,
+ ConnectorCredentialPair.id
+ == DocumentSet__ConnectorCredentialPair.connector_credential_pair_id,
+ )
+ .join(
+ DocumentByConnectorCredentialPair,
+ and_(
+ DocumentByConnectorCredentialPair.connector_id
+ == ConnectorCredentialPair.connector_id,
+ DocumentByConnectorCredentialPair.credential_id
+ == ConnectorCredentialPair.credential_id,
+ ),
+ )
+ .join(
+ Document,
+ Document.id == DocumentByConnectorCredentialPair.id,
+ )
+ .where(Document.id.in_(document_ids))
+ .where(DocumentSet__ConnectorCredentialPair.is_current == True) # noqa: E712
+ .group_by(Document.id)
+ )
+ return db_session.execute(stmt).all() # type: ignore
diff --git a/backend/danswer/db/models.py b/backend/danswer/db/models.py
index 729ddf70b..0130fa88f 100644
--- a/backend/danswer/db/models.py
+++ b/backend/danswer/db/models.py
@@ -14,6 +14,7 @@ from sqlalchemy import ForeignKey
from sqlalchemy import func
from sqlalchemy import Index
from sqlalchemy import Integer
+from sqlalchemy import Sequence
from sqlalchemy import String
from sqlalchemy import Text
from sqlalchemy.dialects import postgresql
@@ -85,6 +86,17 @@ class ConnectorCredentialPair(Base):
"""
__tablename__ = "connector_credential_pair"
+ # NOTE: this `id` column has to use `Sequence` instead of `autoincrement=True`
+ # due to some SQLAlchemy quirks + this not being a primary key column
+ id: Mapped[int] = mapped_column(
+ Integer,
+ Sequence("connector_credential_pair_id_seq"),
+ unique=True,
+ nullable=False,
+ )
+ name: Mapped[str] = mapped_column(
+ String, unique=True, nullable=True
+    )  # nullable for backwards compatibility
connector_id: Mapped[int] = mapped_column(
ForeignKey("connector.id"), primary_key=True
)
@@ -242,6 +254,7 @@ class DocumentByConnectorCredentialPair(Base):
__tablename__ = "document_by_connector_credential_pair"
id: Mapped[str] = mapped_column(ForeignKey("document.id"), primary_key=True)
+ # TODO: transition this to use the ConnectorCredentialPair id directly
connector_id: Mapped[int] = mapped_column(
ForeignKey("connector.id"), primary_key=True
)
@@ -326,6 +339,49 @@ class Document(Base):
)
+class DocumentSet(Base):
+ __tablename__ = "document_set"
+
+ id: Mapped[int] = mapped_column(Integer, primary_key=True)
+ name: Mapped[str] = mapped_column(String, unique=True)
+ description: Mapped[str] = mapped_column(String)
+ user_id: Mapped[UUID | None] = mapped_column(ForeignKey("user.id"), nullable=True)
+    # whether or not changes to the document set have been propagated
+ is_up_to_date: Mapped[bool] = mapped_column(Boolean, nullable=False, default=False)
+
+ connector_credential_pair_relationships: Mapped[
+ list["DocumentSet__ConnectorCredentialPair"]
+ ] = relationship(
+ "DocumentSet__ConnectorCredentialPair", back_populates="document_set"
+ )
+
+
+class DocumentSet__ConnectorCredentialPair(Base):
+ __tablename__ = "document_set__connector_credential_pair"
+
+ document_set_id: Mapped[int] = mapped_column(
+ ForeignKey("document_set.id"), primary_key=True
+ )
+ connector_credential_pair_id: Mapped[int] = mapped_column(
+ ForeignKey("connector_credential_pair.id"), primary_key=True
+ )
+    # if `True`, then is part of the current state of the document set
+    # if `False`, then is part of the prior state of the document set
+    # rows with `is_current=False` only exist while an update to the document
+    # set is being synced; they are deleted once the sync finishes, so none
+    # should remain once `DocumentSet.is_up_to_date == True`
+ is_current: Mapped[bool] = mapped_column(
+ Boolean,
+ nullable=False,
+ default=True,
+ primary_key=True,
+ )
+
+ document_set: Mapped[DocumentSet] = relationship(
+ "DocumentSet", back_populates="connector_credential_pair_relationships"
+ )
+
+
class ChatSession(Base):
__tablename__ = "chat_session"
diff --git a/backend/danswer/document_set/document_set.py b/backend/danswer/document_set/document_set.py
new file mode 100644
index 000000000..0b9ca99b5
--- /dev/null
+++ b/backend/danswer/document_set/document_set.py
@@ -0,0 +1,65 @@
+from sqlalchemy.orm import Session
+
+from danswer.datastores.document_index import get_default_document_index
+from danswer.datastores.interfaces import DocumentIndex
+from danswer.datastores.interfaces import UpdateRequest
+from danswer.db.document import prepare_to_modify_documents
+from danswer.db.document_set import fetch_document_sets_for_documents
+from danswer.db.document_set import fetch_documents_for_document_set
+from danswer.db.document_set import mark_document_set_as_synced
+from danswer.db.engine import get_sqlalchemy_engine
+from danswer.utils.batching import batch_generator
+from danswer.utils.logger import setup_logger
+
+logger = setup_logger()
+
+_SYNC_BATCH_SIZE = 1000
+
+
+def _sync_document_batch(
+ document_ids: list[str], document_index: DocumentIndex
+) -> None:
+ logger.debug(f"Syncing document sets for: {document_ids}")
+ # begin a transaction, release lock at the end
+ with Session(get_sqlalchemy_engine()) as db_session:
+ # acquires a lock on the documents so that no other process can modify them
+ prepare_to_modify_documents(db_session=db_session, document_ids=document_ids)
+
+ # get current state of document sets for these documents
+ document_set_map = {
+ document_id: document_sets
+ for document_id, document_sets in fetch_document_sets_for_documents(
+ document_ids=document_ids, db_session=db_session
+ )
+ }
+
+ # update Vespa
+ document_index.update(
+ update_requests=[
+ UpdateRequest(
+ document_ids=[document_id],
+ document_sets=set(document_set_map.get(document_id, [])),
+ )
+ for document_id in document_ids
+ ]
+ )
+
+
+def sync_document_set(document_set_id: int) -> None:
+ document_index = get_default_document_index()
+ with Session(get_sqlalchemy_engine()) as db_session:
+ documents_to_update = fetch_documents_for_document_set(
+ document_set_id=document_set_id,
+ db_session=db_session,
+ current_only=False,
+ )
+ for document_batch in batch_generator(documents_to_update, _SYNC_BATCH_SIZE):
+ _sync_document_batch(
+ document_ids=[document.id for document in document_batch],
+ document_index=document_index,
+ )
+
+ mark_document_set_as_synced(
+ document_set_id=document_set_id, db_session=db_session
+ )
+ logger.info(f"Document set sync for '{document_set_id}' complete!")
diff --git a/backend/danswer/main.py b/backend/danswer/main.py
index 6c3063f4f..70b9e1584 100644
--- a/backend/danswer/main.py
+++ b/backend/danswer/main.py
@@ -37,6 +37,7 @@ from danswer.db.credentials import create_initial_public_credential
from danswer.direct_qa.llm_utils import get_default_qa_model
from danswer.server.chat_backend import router as chat_router
from danswer.server.credential import router as credential_router
+from danswer.server.document_set import router as document_set_router
from danswer.server.event_loading import router as event_processing_router
from danswer.server.health import router as health_router
from danswer.server.manage import router as admin_router
@@ -77,6 +78,7 @@ def get_application() -> FastAPI:
application.include_router(admin_router)
application.include_router(user_router)
application.include_router(credential_router)
+ application.include_router(document_set_router)
application.include_router(health_router)
application.include_router(
diff --git a/backend/danswer/server/document_set.py b/backend/danswer/server/document_set.py
new file mode 100644
index 000000000..f0a2f9886
--- /dev/null
+++ b/backend/danswer/server/document_set.py
@@ -0,0 +1,101 @@
+from fastapi import APIRouter
+from fastapi import Depends
+from fastapi import HTTPException
+from sqlalchemy.orm import Session
+
+from danswer.auth.users import current_admin_user
+from danswer.auth.users import current_user
+from danswer.db.document_set import delete_document_set as delete_document_set_from_db
+from danswer.db.document_set import fetch_document_sets
+from danswer.db.document_set import insert_document_set
+from danswer.db.document_set import update_document_set
+from danswer.db.engine import get_session
+from danswer.db.models import User
+from danswer.server.models import ConnectorCredentialPairDescriptor
+from danswer.server.models import ConnectorSnapshot
+from danswer.server.models import CredentialSnapshot
+from danswer.server.models import DocumentSet
+from danswer.server.models import DocumentSetCreationRequest
+from danswer.server.models import DocumentSetUpdateRequest
+
+
+router = APIRouter(prefix="/manage")
+
+
+@router.post("/admin/document-set")
+def create_document_set(
+ document_set_creation_request: DocumentSetCreationRequest,
+ user: User = Depends(current_admin_user),
+ db_session: Session = Depends(get_session),
+) -> int:
+ try:
+ document_set_db_model, _ = insert_document_set(
+ document_set_creation_request=document_set_creation_request,
+ user_id=user.id if user else None,
+ db_session=db_session,
+ )
+ except Exception as e:
+ raise HTTPException(status_code=400, detail=str(e))
+ return document_set_db_model.id
+
+
+@router.patch("/admin/document-set")
+def patch_document_set(
+ document_set_update_request: DocumentSetUpdateRequest,
+ _: User = Depends(current_admin_user),
+ db_session: Session = Depends(get_session),
+) -> None:
+ try:
+ update_document_set(
+ document_set_update_request=document_set_update_request,
+ db_session=db_session,
+ )
+ except Exception as e:
+ raise HTTPException(status_code=400, detail=str(e))
+
+
+@router.delete("/admin/document-set/{document_set_id}")
+def delete_document_set(
+ document_set_id: int,
+ _: User = Depends(current_admin_user),
+ db_session: Session = Depends(get_session),
+) -> None:
+ try:
+ delete_document_set_from_db(
+ document_set_id=document_set_id, db_session=db_session
+ )
+ except Exception as e:
+ raise HTTPException(status_code=400, detail=str(e))
+
+
+"""Endpoints for non-admins"""
+
+
+@router.get("/document-set")
+def list_document_sets(
+ _: User = Depends(current_user),
+ db_session: Session = Depends(get_session),
+) -> list[DocumentSet]:
+ document_set_info = fetch_document_sets(db_session=db_session)
+ return [
+ DocumentSet(
+ id=document_set_db_model.id,
+ name=document_set_db_model.name,
+ description=document_set_db_model.description,
+ cc_pair_descriptors=[
+ ConnectorCredentialPairDescriptor(
+ id=cc_pair.id,
+ name=cc_pair.name,
+ connector=ConnectorSnapshot.from_connector_db_model(
+ cc_pair.connector
+ ),
+ credential=CredentialSnapshot.from_credential_db_model(
+ cc_pair.credential
+ ),
+ )
+ for cc_pair in cc_pairs
+ ],
+ is_up_to_date=document_set_db_model.is_up_to_date,
+ )
+ for document_set_db_model, cc_pairs in document_set_info
+ ]
diff --git a/backend/danswer/server/manage.py b/backend/danswer/server/manage.py
index 3803e3296..82dc35b9d 100644
--- a/backend/danswer/server/manage.py
+++ b/backend/danswer/server/manage.py
@@ -8,12 +8,13 @@ from fastapi import HTTPException
from fastapi import Request
from fastapi import Response
from fastapi import UploadFile
+from sqlalchemy.exc import IntegrityError
from sqlalchemy.orm import Session
from danswer.auth.users import current_admin_user
from danswer.auth.users import current_user
-from danswer.background.celery import cleanup_connector_credential_pair_task
-from danswer.background.celery import get_deletion_status
+from danswer.background.celery.celery import cleanup_connector_credential_pair_task
+from danswer.background.celery.deletion_utils import get_deletion_status
from danswer.background.connector_deletion import (
get_cleanup_task_id,
)
@@ -69,6 +70,7 @@ from danswer.server.models import BoostDoc
from danswer.server.models import BoostUpdateRequest
from danswer.server.models import ConnectorBase
from danswer.server.models import ConnectorCredentialPairIdentifier
+from danswer.server.models import ConnectorCredentialPairMetadata
from danswer.server.models import ConnectorIndexingStatus
from danswer.server.models import ConnectorSnapshot
from danswer.server.models import CredentialSnapshot
@@ -316,6 +318,8 @@ def get_connector_indexing_status(
)
indexing_statuses.append(
ConnectorIndexingStatus(
+ cc_pair_id=cc_pair.id,
+ name=cc_pair.name,
connector=ConnectorSnapshot.from_connector_db_model(connector),
credential=CredentialSnapshot.from_credential_db_model(credential),
public_doc=credential.public_doc,
@@ -390,8 +394,11 @@ def delete_connector_by_id(
_: User = Depends(current_admin_user),
db_session: Session = Depends(get_session),
) -> StatusResponse[int]:
- with db_session.begin():
- return delete_connector(db_session=db_session, connector_id=connector_id)
+ try:
+ with db_session.begin():
+ return delete_connector(db_session=db_session, connector_id=connector_id)
+ except AssertionError:
+ raise HTTPException(status_code=400, detail="Connector is not deletable")
@router.post("/admin/connector/run-once")
@@ -650,10 +657,20 @@ def get_connector_by_id(
def associate_credential_to_connector(
connector_id: int,
credential_id: int,
+ metadata: ConnectorCredentialPairMetadata,
user: User = Depends(current_user),
db_session: Session = Depends(get_session),
) -> StatusResponse[int]:
- return add_credential_to_connector(connector_id, credential_id, user, db_session)
+ try:
+ return add_credential_to_connector(
+ connector_id=connector_id,
+ credential_id=credential_id,
+ cc_pair_name=metadata.name,
+ user=user,
+ db_session=db_session,
+ )
+ except IntegrityError:
+ raise HTTPException(status_code=400, detail="Name must be unique")
@router.delete("/connector/{connector_id}/credential/{credential_id}")
diff --git a/backend/danswer/server/models.py b/backend/danswer/server/models.py
index 6c7ecbe78..24a9474bd 100644
--- a/backend/danswer/server/models.py
+++ b/backend/danswer/server/models.py
@@ -333,6 +333,8 @@ class CredentialSnapshot(CredentialBase):
class ConnectorIndexingStatus(BaseModel):
"""Represents the latest indexing status of a connector"""
+ cc_pair_id: int
+ name: str | None
connector: ConnectorSnapshot
credential: CredentialSnapshot
owner: str
@@ -351,5 +353,36 @@ class ConnectorCredentialPairIdentifier(BaseModel):
credential_id: int
+class ConnectorCredentialPairMetadata(BaseModel):
+ name: str | None
+
+
+class ConnectorCredentialPairDescriptor(BaseModel):
+ id: int
+ name: str | None
+ connector: ConnectorSnapshot
+ credential: CredentialSnapshot
+
+
class ApiKey(BaseModel):
api_key: str
+
+
+class DocumentSetCreationRequest(BaseModel):
+ name: str
+ description: str
+ cc_pair_ids: list[int]
+
+
+class DocumentSetUpdateRequest(BaseModel):
+ id: int
+ description: str
+ cc_pair_ids: list[int]
+
+
+class DocumentSet(BaseModel):
+ id: int
+ name: str
+ description: str
+ cc_pair_descriptors: list[ConnectorCredentialPairDescriptor]
+ is_up_to_date: bool
diff --git a/backend/supervisord.conf b/backend/supervisord.conf
index 47e2c17d8..b28fa0024 100644
--- a/backend/supervisord.conf
+++ b/backend/supervisord.conf
@@ -24,6 +24,13 @@ stdout_logfile_maxbytes=52428800
redirect_stderr=true
autorestart=true
+[program:document_set_sync]
+command=python danswer/background/document_set_sync_script.py
+stdout_logfile=/var/log/document_set_sync.log
+stdout_logfile_maxbytes=52428800
+redirect_stderr=true
+autorestart=true
+
# Listens for slack messages and responds with answers
# for all channels that the DanswerBot has been added to.
# If not setup, this will just fail 5 times and then stop.
@@ -39,7 +46,7 @@ startsecs=60
# pushes all logs from the above programs to stdout
[program:log-redirect-handler]
-command=tail -qF /var/log/update.log /var/log/celery.log /var/log/file_deletion.log /var/log/slack_bot_listener.log
+command=tail -qF /var/log/update.log /var/log/celery.log /var/log/file_deletion.log /var/log/slack_bot_listener.log /var/log/document_set_sync.log
stdout_logfile=/dev/stdout
stdout_logfile_maxbytes=0
redirect_stderr=true
diff --git a/web/src/app/admin/connectors/bookstack/page.tsx b/web/src/app/admin/connectors/bookstack/page.tsx
index d32985db7..86a95c1ea 100644
--- a/web/src/app/admin/connectors/bookstack/page.tsx
+++ b/web/src/app/admin/connectors/bookstack/page.tsx
@@ -9,6 +9,7 @@ import {
BookstackCredentialJson,
BookstackConfig,
ConnectorIndexingStatus,
+ Credential,
} from "@/lib/types";
import useSWR, { useSWRConfig } from "swr";
import { fetcher } from "@/lib/fetcher";
@@ -60,9 +61,10 @@ const Main = () => {
(connectorIndexingStatus) =>
connectorIndexingStatus.connector.source === "bookstack"
);
- const bookstackCredential = credentialsData.filter(
- (credential) => credential.credential_json?.bookstack_api_token_id
- )[0];
+ const bookstackCredential: Credential
+            Please provide your slack bot token in Step 1 first! Once done with
+            that, you can then specify which Slack channels you want to make
+            searchable.
+          </p>
+        )}
     </>
   );
 };
diff --git a/web/src/app/admin/connectors/web/page.tsx b/web/src/app/admin/connectors/web/page.tsx
index 7d0f40177..0886c2a12 100644
--- a/web/src/app/admin/connectors/web/page.tsx
+++ b/web/src/app/admin/connectors/web/page.tsx
@@ -49,6 +49,8 @@ export default function Web() {