mirror of
https://github.com/danswer-ai/danswer.git
synced 2025-03-19 06:12:05 +01:00
61 lines
2.4 KiB
Docker
61 lines
2.4 KiB
Docker
FROM python:3.11.7-slim-bookworm
|
|
|
|
LABEL com.danswer.maintainer="founders@danswer.ai"
|
|
LABEL com.danswer.description="This image is for the Danswer model server which runs all of the \
|
|
AI models for Danswer. This container and all the code is MIT Licensed and free for all to use. \
|
|
You can find it at https://hub.docker.com/r/danswer/danswer-model-server. For more details, \
|
|
visit https://github.com/danswer-ai/danswer."
|
|
|
|
# Default DANSWER_VERSION, typically overriden during builds by GitHub Actions.
|
|
ARG DANSWER_VERSION=0.3-dev
|
|
ENV DANSWER_VERSION=${DANSWER_VERSION} \
|
|
DANSWER_RUNNING_IN_DOCKER="true"
|
|
|
|
|
|
RUN echo "DANSWER_VERSION: ${DANSWER_VERSION}"
|
|
|
|
COPY ./requirements/model_server.txt /tmp/requirements.txt
|
|
RUN pip install --no-cache-dir --upgrade \
|
|
--retries 5 \
|
|
--timeout 30 \
|
|
-r /tmp/requirements.txt
|
|
|
|
RUN apt-get remove -y --allow-remove-essential perl-base && \
|
|
apt-get autoremove -y
|
|
|
|
# Pre-downloading models for setups with limited egress
|
|
# Download tokenizers, distilbert for the Danswer model
|
|
# Download model weights
|
|
# Run Nomic to pull in the custom architecture and have it cached locally
|
|
RUN python -c "from transformers import AutoTokenizer; \
|
|
AutoTokenizer.from_pretrained('distilbert-base-uncased'); \
|
|
AutoTokenizer.from_pretrained('mixedbread-ai/mxbai-rerank-xsmall-v1'); \
|
|
from huggingface_hub import snapshot_download; \
|
|
snapshot_download(repo_id='danswer/hybrid-intent-token-classifier', revision='v1.0.3'); \
|
|
snapshot_download('nomic-ai/nomic-embed-text-v1'); \
|
|
snapshot_download('mixedbread-ai/mxbai-rerank-xsmall-v1'); \
|
|
from sentence_transformers import SentenceTransformer; \
|
|
SentenceTransformer(model_name_or_path='nomic-ai/nomic-embed-text-v1', trust_remote_code=True);"
|
|
|
|
# In case the user has volumes mounted to /root/.cache/huggingface that they've downloaded while
|
|
# running Danswer, don't overwrite it with the built in cache folder
|
|
RUN mv /root/.cache/huggingface /root/.cache/temp_huggingface
|
|
|
|
WORKDIR /app
|
|
|
|
# Utils used by model server
|
|
COPY ./danswer/utils/logger.py /app/danswer/utils/logger.py
|
|
|
|
# Place to fetch version information
|
|
COPY ./danswer/__init__.py /app/danswer/__init__.py
|
|
|
|
# Shared between Danswer Backend and Model Server
|
|
COPY ./shared_configs /app/shared_configs
|
|
|
|
# Model Server main code
|
|
COPY ./model_server /app/model_server
|
|
|
|
ENV PYTHONPATH=/app
|
|
|
|
CMD ["uvicorn", "model_server.main:app", "--host", "0.0.0.0", "--port", "9000"]
|