mirror of
https://github.com/danswer-ai/danswer.git
synced 2025-05-04 08:50:24 +02:00
Helm chart refactoring (#3797)
* Initial commit for Helm chart refactoring
* Continue refactoring Helm. I was able to use Helm to deploy all of the apps to a cluster in AWS. The bottleneck was setting up PVC dynamic provisioning.
* Use default storage class
* Fix linter errors
* Fix broken Helm test

---------

Co-authored-by: jpb80 <jordan.buttkevitz@gmail.com>
This commit is contained in:
parent
e061ba2b93
commit
715359c120
22
.github/workflows/pr-helm-chart-testing.yml
vendored
22
.github/workflows/pr-helm-chart-testing.yml
vendored
@ -21,10 +21,10 @@ jobs:
|
|||||||
- name: Set up Helm
|
- name: Set up Helm
|
||||||
uses: azure/setup-helm@v4.2.0
|
uses: azure/setup-helm@v4.2.0
|
||||||
with:
|
with:
|
||||||
version: v3.14.4
|
version: v3.17.0
|
||||||
|
|
||||||
- name: Set up chart-testing
|
- name: Set up chart-testing
|
||||||
uses: helm/chart-testing-action@v2.6.1
|
uses: helm/chart-testing-action@v2.7.0
|
||||||
|
|
||||||
# even though we specify chart-dirs in ct.yaml, it isn't used by ct for the list-changed command...
|
# even though we specify chart-dirs in ct.yaml, it isn't used by ct for the list-changed command...
|
||||||
- name: Run chart-testing (list-changed)
|
- name: Run chart-testing (list-changed)
|
||||||
@ -37,22 +37,6 @@ jobs:
|
|||||||
echo "changed=true" >> "$GITHUB_OUTPUT"
|
echo "changed=true" >> "$GITHUB_OUTPUT"
|
||||||
fi
|
fi
|
||||||
|
|
||||||
# rkuo: I don't think we need python?
|
|
||||||
# - name: Set up Python
|
|
||||||
# uses: actions/setup-python@v5
|
|
||||||
# with:
|
|
||||||
# python-version: '3.11'
|
|
||||||
# cache: 'pip'
|
|
||||||
# cache-dependency-path: |
|
|
||||||
# backend/requirements/default.txt
|
|
||||||
# backend/requirements/dev.txt
|
|
||||||
# backend/requirements/model_server.txt
|
|
||||||
# - run: |
|
|
||||||
# python -m pip install --upgrade pip
|
|
||||||
# pip install --retries 5 --timeout 30 -r backend/requirements/default.txt
|
|
||||||
# pip install --retries 5 --timeout 30 -r backend/requirements/dev.txt
|
|
||||||
# pip install --retries 5 --timeout 30 -r backend/requirements/model_server.txt
|
|
||||||
|
|
||||||
# lint all charts if any changes were detected
|
# lint all charts if any changes were detected
|
||||||
- name: Run chart-testing (lint)
|
- name: Run chart-testing (lint)
|
||||||
if: steps.list-changed.outputs.changed == 'true'
|
if: steps.list-changed.outputs.changed == 'true'
|
||||||
@ -62,7 +46,7 @@ jobs:
|
|||||||
|
|
||||||
- name: Create kind cluster
|
- name: Create kind cluster
|
||||||
if: steps.list-changed.outputs.changed == 'true'
|
if: steps.list-changed.outputs.changed == 'true'
|
||||||
uses: helm/kind-action@v1.10.0
|
uses: helm/kind-action@v1.12.0
|
||||||
|
|
||||||
- name: Run chart-testing (install)
|
- name: Run chart-testing (install)
|
||||||
if: steps.list-changed.outputs.changed == 'true'
|
if: steps.list-changed.outputs.changed == 'true'
|
||||||
|
@ -6,7 +6,7 @@ sources:
|
|||||||
- "https://github.com/onyx-dot-app/onyx"
|
- "https://github.com/onyx-dot-app/onyx"
|
||||||
type: application
|
type: application
|
||||||
version: 0.2.1
|
version: 0.2.1
|
||||||
appVersion: "latest"
|
appVersion: latest
|
||||||
annotations:
|
annotations:
|
||||||
category: Productivity
|
category: Productivity
|
||||||
licenses: MIT
|
licenses: MIT
|
||||||
|
@ -45,10 +45,10 @@ spec:
|
|||||||
- |
|
- |
|
||||||
alembic upgrade head &&
|
alembic upgrade head &&
|
||||||
echo "Starting Onyx Api Server" &&
|
echo "Starting Onyx Api Server" &&
|
||||||
uvicorn onyx.main:app --host 0.0.0.0 --port 8080
|
uvicorn onyx.main:app --host 0.0.0.0 --port {{ .Values.api.containerPorts.server }}
|
||||||
ports:
|
ports:
|
||||||
- name: api-server-port
|
- name: api-server-port
|
||||||
containerPort: {{ .Values.api.service.port }}
|
containerPort: {{ .Values.api.containerPorts.server }}
|
||||||
protocol: TCP
|
protocol: TCP
|
||||||
resources:
|
resources:
|
||||||
{{- toYaml .Values.api.resources | nindent 12 }}
|
{{- toYaml .Values.api.resources | nindent 12 }}
|
||||||
|
@ -11,10 +11,10 @@ metadata:
|
|||||||
spec:
|
spec:
|
||||||
type: {{ .Values.api.service.type }}
|
type: {{ .Values.api.service.type }}
|
||||||
ports:
|
ports:
|
||||||
- port: {{ .Values.api.service.port }}
|
- port: {{ .Values.api.service.servicePort }}
|
||||||
targetPort: api-server-port
|
targetPort: {{ .Values.api.service.targetPort }}
|
||||||
protocol: TCP
|
protocol: TCP
|
||||||
name: api-server-port
|
name: {{ .Values.api.service.portName }}
|
||||||
selector:
|
selector:
|
||||||
{{- include "onyx-stack.selectorLabels" . | nindent 4 }}
|
{{- include "onyx-stack.selectorLabels" . | nindent 4 }}
|
||||||
{{- if .Values.api.deploymentLabels }}
|
{{- if .Values.api.deploymentLabels }}
|
||||||
|
@ -5,7 +5,7 @@ metadata:
|
|||||||
labels:
|
labels:
|
||||||
{{- include "onyx-stack.labels" . | nindent 4 }}
|
{{- include "onyx-stack.labels" . | nindent 4 }}
|
||||||
spec:
|
spec:
|
||||||
replicas: 1
|
replicas: {{ .Values.indexCapability.replicaCount }}
|
||||||
selector:
|
selector:
|
||||||
matchLabels:
|
matchLabels:
|
||||||
{{- include "onyx-stack.selectorLabels" . | nindent 6 }}
|
{{- include "onyx-stack.selectorLabels" . | nindent 6 }}
|
||||||
@ -25,12 +25,14 @@ spec:
|
|||||||
{{- end }}
|
{{- end }}
|
||||||
spec:
|
spec:
|
||||||
containers:
|
containers:
|
||||||
- name: indexing-model-server
|
- name: {{ .Values.indexCapability.name }}
|
||||||
image: onyxdotapp/onyx-model-server:latest
|
image: "{{ .Values.indexCapability.image.repository }}:{{ .Values.indexCapability.image.tag | default .Chart.AppVersion }}"
|
||||||
imagePullPolicy: IfNotPresent
|
imagePullPolicy: {{ .Values.indexCapability.image.pullPolicy }}
|
||||||
command: [ "uvicorn", "model_server.main:app", "--host", "0.0.0.0", "--port", "9000", "--limit-concurrency", "10" ]
|
command: [ "uvicorn", "model_server.main:app", "--host", "0.0.0.0", "--port", "{{ .Values.indexCapability.containerPorts.server }}", "--limit-concurrency", "{{ .Values.indexCapability.limitConcurrency }}" ]
|
||||||
ports:
|
ports:
|
||||||
- containerPort: 9000
|
- name: model-server
|
||||||
|
containerPort: {{ .Values.indexCapability.containerPorts.server }}
|
||||||
|
protocol: TCP
|
||||||
envFrom:
|
envFrom:
|
||||||
- configMapRef:
|
- configMapRef:
|
||||||
name: {{ .Values.config.envConfigMapName }}
|
name: {{ .Values.config.envConfigMapName }}
|
||||||
|
@ -3,6 +3,7 @@ kind: PersistentVolumeClaim
|
|||||||
metadata:
|
metadata:
|
||||||
name: {{ .Values.indexCapability.indexingModelPVC.name }}
|
name: {{ .Values.indexCapability.indexingModelPVC.name }}
|
||||||
spec:
|
spec:
|
||||||
|
storageClassName: {{ .Values.persistent.storageClassName }}
|
||||||
accessModes:
|
accessModes:
|
||||||
- {{ .Values.indexCapability.indexingModelPVC.accessMode | quote }}
|
- {{ .Values.indexCapability.indexingModelPVC.accessMode | quote }}
|
||||||
resources:
|
resources:
|
||||||
|
@ -11,8 +11,8 @@ spec:
|
|||||||
{{- toYaml .Values.indexCapability.deploymentLabels | nindent 4 }}
|
{{- toYaml .Values.indexCapability.deploymentLabels | nindent 4 }}
|
||||||
{{- end }}
|
{{- end }}
|
||||||
ports:
|
ports:
|
||||||
- name: {{ .Values.indexCapability.service.name }}
|
- name: {{ .Values.indexCapability.service.portName }}
|
||||||
protocol: TCP
|
protocol: TCP
|
||||||
port: {{ .Values.indexCapability.service.port }}
|
port: {{ .Values.indexCapability.service.servicePort }}
|
||||||
targetPort: {{ .Values.indexCapability.service.port }}
|
targetPort: {{ .Values.indexCapability.service.targetPort }}
|
||||||
type: {{ .Values.indexCapability.service.type }}
|
type: {{ .Values.indexCapability.service.type }}
|
@ -3,14 +3,14 @@ kind: Deployment
|
|||||||
metadata:
|
metadata:
|
||||||
name: {{ include "onyx-stack.fullname" . }}-inference-model
|
name: {{ include "onyx-stack.fullname" . }}-inference-model
|
||||||
labels:
|
labels:
|
||||||
{{- range .Values.inferenceCapability.deployment.labels }}
|
{{- range .Values.inferenceCapability.labels }}
|
||||||
{{ .key }}: {{ .value }}
|
{{ .key }}: {{ .value }}
|
||||||
{{- end }}
|
{{- end }}
|
||||||
spec:
|
spec:
|
||||||
replicas: {{ .Values.inferenceCapability.deployment.replicas }}
|
replicas: {{ .Values.inferenceCapability.replicaCount }}
|
||||||
selector:
|
selector:
|
||||||
matchLabels:
|
matchLabels:
|
||||||
{{- range .Values.inferenceCapability.deployment.labels }}
|
{{- range .Values.inferenceCapability.labels }}
|
||||||
{{ .key }}: {{ .value }}
|
{{ .key }}: {{ .value }}
|
||||||
{{- end }}
|
{{- end }}
|
||||||
template:
|
template:
|
||||||
@ -21,24 +21,26 @@ spec:
|
|||||||
{{- end }}
|
{{- end }}
|
||||||
spec:
|
spec:
|
||||||
containers:
|
containers:
|
||||||
- name: {{ .Values.inferenceCapability.service.name }}
|
- name: model-server-inference
|
||||||
image: {{ .Values.inferenceCapability.deployment.image.repository }}:{{ .Values.inferenceCapability.deployment.image.tag }}
|
image: "{{ .Values.inferenceCapability.image.repository }}:{{ .Values.inferenceCapability.image.tag | default .Chart.AppVersion }}"
|
||||||
imagePullPolicy: {{ .Values.inferenceCapability.deployment.image.pullPolicy }}
|
imagePullPolicy: {{ .Values.inferenceCapability.image.pullPolicy }}
|
||||||
command: {{ toYaml .Values.inferenceCapability.deployment.command | nindent 14 }}
|
command: [ "uvicorn", "model_server.main:app", "--host", "0.0.0.0", "--port", "{{ .Values.inferenceCapability.containerPorts.server }}" ]
|
||||||
ports:
|
ports:
|
||||||
- containerPort: {{ .Values.inferenceCapability.service.port }}
|
- name: model-server
|
||||||
|
containerPort: {{ .Values.inferenceCapability.containerPorts.server }}
|
||||||
|
protocol: TCP
|
||||||
envFrom:
|
envFrom:
|
||||||
- configMapRef:
|
- configMapRef:
|
||||||
name: {{ .Values.config.envConfigMapName }}
|
name: {{ .Values.config.envConfigMapName }}
|
||||||
env:
|
env:
|
||||||
{{- include "onyx-stack.envSecrets" . | nindent 12}}
|
{{- include "onyx-stack.envSecrets" . | nindent 12}}
|
||||||
volumeMounts:
|
volumeMounts:
|
||||||
{{- range .Values.inferenceCapability.deployment.volumeMounts }}
|
{{- range .Values.inferenceCapability.volumeMounts }}
|
||||||
- name: {{ .name }}
|
- name: {{ .name }}
|
||||||
mountPath: {{ .mountPath }}
|
mountPath: {{ .mountPath }}
|
||||||
{{- end }}
|
{{- end }}
|
||||||
volumes:
|
volumes:
|
||||||
{{- range .Values.inferenceCapability.deployment.volumes }}
|
{{- range .Values.inferenceCapability.volumes }}
|
||||||
- name: {{ .name }}
|
- name: {{ .name }}
|
||||||
persistentVolumeClaim:
|
persistentVolumeClaim:
|
||||||
claimName: {{ .persistentVolumeClaim.claimName }}
|
claimName: {{ .persistentVolumeClaim.claimName }}
|
||||||
|
@ -3,6 +3,7 @@ kind: PersistentVolumeClaim
|
|||||||
metadata:
|
metadata:
|
||||||
name: {{ .Values.inferenceCapability.pvc.name }}
|
name: {{ .Values.inferenceCapability.pvc.name }}
|
||||||
spec:
|
spec:
|
||||||
|
storageClassName: {{ .Values.persistent.storageClassName }}
|
||||||
accessModes:
|
accessModes:
|
||||||
{{- toYaml .Values.inferenceCapability.pvc.accessModes | nindent 4 }}
|
{{- toYaml .Values.inferenceCapability.pvc.accessModes | nindent 4 }}
|
||||||
resources:
|
resources:
|
||||||
|
@ -5,11 +5,11 @@ metadata:
|
|||||||
spec:
|
spec:
|
||||||
type: {{ .Values.inferenceCapability.service.type }}
|
type: {{ .Values.inferenceCapability.service.type }}
|
||||||
ports:
|
ports:
|
||||||
- port: {{ .Values.inferenceCapability.service.port }}
|
- port: {{ .Values.inferenceCapability.service.servicePort}}
|
||||||
targetPort: {{ .Values.inferenceCapability.service.port }}
|
targetPort: {{ .Values.inferenceCapability.service.targetPort }}
|
||||||
protocol: TCP
|
protocol: TCP
|
||||||
name: {{ .Values.inferenceCapability.service.name }}
|
name: {{ .Values.inferenceCapability.service.portName }}
|
||||||
selector:
|
selector:
|
||||||
{{- range .Values.inferenceCapability.deployment.labels }}
|
{{- range .Values.inferenceCapability.labels }}
|
||||||
{{ .key }}: {{ .value }}
|
{{ .key }}: {{ .value }}
|
||||||
{{- end }}
|
{{- end }}
|
||||||
|
@ -5,11 +5,11 @@ metadata:
|
|||||||
data:
|
data:
|
||||||
nginx.conf: |
|
nginx.conf: |
|
||||||
upstream api_server {
|
upstream api_server {
|
||||||
server {{ include "onyx-stack.fullname" . }}-api-service:{{ .Values.api.service.port }} fail_timeout=0;
|
server {{ include "onyx-stack.fullname" . }}-api-service:{{ .Values.api.service.servicePort }} fail_timeout=0;
|
||||||
}
|
}
|
||||||
|
|
||||||
upstream web_server {
|
upstream web_server {
|
||||||
server {{ include "onyx-stack.fullname" . }}-webserver:{{ .Values.webserver.service.port }} fail_timeout=0;
|
server {{ include "onyx-stack.fullname" . }}-webserver:{{ .Values.webserver.service.servicePort }} fail_timeout=0;
|
||||||
}
|
}
|
||||||
|
|
||||||
server {
|
server {
|
||||||
|
@ -11,5 +11,5 @@ spec:
|
|||||||
- name: wget
|
- name: wget
|
||||||
image: busybox
|
image: busybox
|
||||||
command: ['wget']
|
command: ['wget']
|
||||||
args: ['{{ include "onyx-stack.fullname" . }}-webserver:{{ .Values.webserver.service.port }}']
|
args: ['{{ include "onyx-stack.fullname" . }}-webserver:{{ .Values.webserver.service.servicePort }}']
|
||||||
restartPolicy: Never
|
restartPolicy: Never
|
||||||
|
@ -41,7 +41,7 @@ spec:
|
|||||||
imagePullPolicy: {{ .Values.webserver.image.pullPolicy }}
|
imagePullPolicy: {{ .Values.webserver.image.pullPolicy }}
|
||||||
ports:
|
ports:
|
||||||
- name: http
|
- name: http
|
||||||
containerPort: {{ .Values.webserver.service.port }}
|
containerPort: {{ .Values.webserver.containerPorts.server }}
|
||||||
protocol: TCP
|
protocol: TCP
|
||||||
resources:
|
resources:
|
||||||
{{- toYaml .Values.webserver.resources | nindent 12 }}
|
{{- toYaml .Values.webserver.resources | nindent 12 }}
|
||||||
|
@ -10,8 +10,8 @@ metadata:
|
|||||||
spec:
|
spec:
|
||||||
type: {{ .Values.webserver.service.type }}
|
type: {{ .Values.webserver.service.type }}
|
||||||
ports:
|
ports:
|
||||||
- port: {{ .Values.webserver.service.port }}
|
- port: {{ .Values.webserver.service.servicePort }}
|
||||||
targetPort: http
|
targetPort: {{ .Values.webserver.service.targetPort }}
|
||||||
protocol: TCP
|
protocol: TCP
|
||||||
name: http
|
name: http
|
||||||
selector:
|
selector:
|
||||||
|
@ -2,40 +2,46 @@
|
|||||||
# This is a YAML-formatted file.
|
# This is a YAML-formatted file.
|
||||||
# Declare variables to be passed into your templates.
|
# Declare variables to be passed into your templates.
|
||||||
|
|
||||||
|
postgresql:
|
||||||
|
primary:
|
||||||
|
persistence:
|
||||||
|
size: 5Gi
|
||||||
|
enabled: true
|
||||||
|
auth:
|
||||||
|
existingSecret: onyx-secrets
|
||||||
|
secretKeys:
|
||||||
|
# overwriting as postgres typically expects 'postgres-password'
|
||||||
|
adminPasswordKey: postgres_password
|
||||||
imagePullSecrets: []
|
imagePullSecrets: []
|
||||||
nameOverride: ""
|
nameOverride: ""
|
||||||
fullnameOverride: ""
|
fullnameOverride: ""
|
||||||
|
|
||||||
|
persistent:
|
||||||
|
storageClassName: ""
|
||||||
|
|
||||||
inferenceCapability:
|
inferenceCapability:
|
||||||
service:
|
service:
|
||||||
name: inference-model-server-service
|
portName: modelserver
|
||||||
type: ClusterIP
|
type: ClusterIP
|
||||||
port: 9000
|
servicePort: 9000
|
||||||
|
targetPort: 9000
|
||||||
pvc:
|
pvc:
|
||||||
name: inference-model-pvc
|
name: inference-model-pvc
|
||||||
accessModes:
|
accessModes:
|
||||||
- ReadWriteOnce
|
- ReadWriteOnce
|
||||||
storage: 3Gi
|
storage: 3Gi
|
||||||
deployment:
|
name: inference-model-server
|
||||||
name: inference-model-server-deployment
|
replicaCount: 1
|
||||||
replicas: 1
|
|
||||||
labels:
|
labels:
|
||||||
- key: app
|
- key: app
|
||||||
value: inference-model-server
|
value: inference-model-server
|
||||||
image:
|
image:
|
||||||
repository: onyxdotapp/onyx-model-server
|
repository: onyxdotapp/onyx-model-server
|
||||||
tag: latest
|
# Overrides the image tag whose default is the chart appVersion.
|
||||||
|
tag: ""
|
||||||
pullPolicy: IfNotPresent
|
pullPolicy: IfNotPresent
|
||||||
command:
|
containerPorts:
|
||||||
[
|
server: 9000
|
||||||
"uvicorn",
|
|
||||||
"model_server.main:app",
|
|
||||||
"--host",
|
|
||||||
"0.0.0.0",
|
|
||||||
"--port",
|
|
||||||
"9000",
|
|
||||||
]
|
|
||||||
port: 9000
|
|
||||||
volumeMounts:
|
volumeMounts:
|
||||||
- name: inference-model-storage
|
- name: inference-model-storage
|
||||||
mountPath: /root/.cache
|
mountPath: /root/.cache
|
||||||
@ -49,15 +55,20 @@ inferenceCapability:
|
|||||||
|
|
||||||
indexCapability:
|
indexCapability:
|
||||||
service:
|
service:
|
||||||
|
portName: modelserver
|
||||||
type: ClusterIP
|
type: ClusterIP
|
||||||
port: 9000
|
servicePort: 9000
|
||||||
name: indexing-model-server-port
|
targetPort: 9000
|
||||||
|
replicaCount: 1
|
||||||
|
name: indexing-model-server
|
||||||
deploymentLabels:
|
deploymentLabels:
|
||||||
app: indexing-model-server
|
app: indexing-model-server
|
||||||
podLabels:
|
podLabels:
|
||||||
app: indexing-model-server
|
app: indexing-model-server
|
||||||
indexingOnly: "True"
|
indexingOnly: "True"
|
||||||
podAnnotations: {}
|
podAnnotations: {}
|
||||||
|
containerPorts:
|
||||||
|
server: 9000
|
||||||
volumeMounts:
|
volumeMounts:
|
||||||
- name: indexing-model-storage
|
- name: indexing-model-storage
|
||||||
mountPath: /root/.cache
|
mountPath: /root/.cache
|
||||||
@ -69,7 +80,12 @@ indexCapability:
|
|||||||
name: indexing-model-storage
|
name: indexing-model-storage
|
||||||
accessMode: "ReadWriteOnce"
|
accessMode: "ReadWriteOnce"
|
||||||
storage: "3Gi"
|
storage: "3Gi"
|
||||||
|
image:
|
||||||
|
repository: onyxdotapp/onyx-model-server
|
||||||
|
# Overrides the image tag whose default is the chart appVersion.
|
||||||
|
tag: ""
|
||||||
|
pullPolicy: IfNotPresent
|
||||||
|
limitConcurrency: 10
|
||||||
config:
|
config:
|
||||||
envConfigMapName: env-configmap
|
envConfigMapName: env-configmap
|
||||||
|
|
||||||
@ -84,16 +100,6 @@ serviceAccount:
|
|||||||
# If not set and create is true, a name is generated using the fullname template
|
# If not set and create is true, a name is generated using the fullname template
|
||||||
name: ""
|
name: ""
|
||||||
|
|
||||||
postgresql:
|
|
||||||
primary:
|
|
||||||
persistence:
|
|
||||||
size: 5Gi
|
|
||||||
enabled: true
|
|
||||||
auth:
|
|
||||||
existingSecret: onyx-secrets
|
|
||||||
secretKeys:
|
|
||||||
adminPasswordKey: postgres_password # overwriting as postgres typically expects 'postgres-password'
|
|
||||||
|
|
||||||
nginx:
|
nginx:
|
||||||
containerPorts:
|
containerPorts:
|
||||||
http: 1024
|
http: 1024
|
||||||
@ -135,9 +141,13 @@ webserver:
|
|||||||
# runAsNonRoot: true
|
# runAsNonRoot: true
|
||||||
# runAsUser: 1000
|
# runAsUser: 1000
|
||||||
|
|
||||||
|
containerPorts:
|
||||||
|
server: 3000
|
||||||
|
|
||||||
service:
|
service:
|
||||||
type: ClusterIP
|
type: ClusterIP
|
||||||
port: 3000
|
servicePort: 3000
|
||||||
|
targetPort: http
|
||||||
|
|
||||||
resources: {}
|
resources: {}
|
||||||
# We usually recommend not to specify default resources and to leave this as a conscious
|
# We usually recommend not to specify default resources and to leave this as a conscious
|
||||||
@ -156,7 +166,7 @@ webserver:
|
|||||||
minReplicas: 1
|
minReplicas: 1
|
||||||
maxReplicas: 100
|
maxReplicas: 100
|
||||||
targetCPUUtilizationPercentage: 80
|
targetCPUUtilizationPercentage: 80
|
||||||
# targetMemoryUtilizationPercentage: 80
|
targetMemoryUtilizationPercentage: 80
|
||||||
|
|
||||||
# Additional volumes on the output Deployment definition.
|
# Additional volumes on the output Deployment definition.
|
||||||
volumes: []
|
volumes: []
|
||||||
@ -189,6 +199,9 @@ api:
|
|||||||
scope: onyx-backend
|
scope: onyx-backend
|
||||||
app: api-server
|
app: api-server
|
||||||
|
|
||||||
|
containerPorts:
|
||||||
|
server: 8080
|
||||||
|
|
||||||
podSecurityContext:
|
podSecurityContext:
|
||||||
{}
|
{}
|
||||||
# fsGroup: 2000
|
# fsGroup: 2000
|
||||||
@ -204,7 +217,9 @@ api:
|
|||||||
|
|
||||||
service:
|
service:
|
||||||
type: ClusterIP
|
type: ClusterIP
|
||||||
port: 8080
|
servicePort: 8080
|
||||||
|
targetPort: api-server-port
|
||||||
|
portName: api-server-port
|
||||||
|
|
||||||
resources: {}
|
resources: {}
|
||||||
# We usually recommend not to specify default resources and to leave this as a conscious
|
# We usually recommend not to specify default resources and to leave this as a conscious
|
||||||
@ -223,7 +238,7 @@ api:
|
|||||||
minReplicas: 1
|
minReplicas: 1
|
||||||
maxReplicas: 100
|
maxReplicas: 100
|
||||||
targetCPUUtilizationPercentage: 80
|
targetCPUUtilizationPercentage: 80
|
||||||
# targetMemoryUtilizationPercentage: 80
|
targetMemoryUtilizationPercentage: 80
|
||||||
|
|
||||||
# Additional volumes on the output Deployment definition.
|
# Additional volumes on the output Deployment definition.
|
||||||
volumes: []
|
volumes: []
|
||||||
@ -247,7 +262,7 @@ background:
|
|||||||
repository: onyxdotapp/onyx-backend
|
repository: onyxdotapp/onyx-backend
|
||||||
pullPolicy: IfNotPresent
|
pullPolicy: IfNotPresent
|
||||||
# Overrides the image tag whose default is the chart appVersion.
|
# Overrides the image tag whose default is the chart appVersion.
|
||||||
tag: latest
|
tag: ""
|
||||||
podAnnotations: {}
|
podAnnotations: {}
|
||||||
podLabels:
|
podLabels:
|
||||||
scope: onyx-backend
|
scope: onyx-backend
|
||||||
@ -284,7 +299,7 @@ background:
|
|||||||
minReplicas: 1
|
minReplicas: 1
|
||||||
maxReplicas: 100
|
maxReplicas: 100
|
||||||
targetCPUUtilizationPercentage: 80
|
targetCPUUtilizationPercentage: 80
|
||||||
# targetMemoryUtilizationPercentage: 80
|
targetMemoryUtilizationPercentage: 80
|
||||||
|
|
||||||
# Additional volumes on the output Deployment definition.
|
# Additional volumes on the output Deployment definition.
|
||||||
volumes: []
|
volumes: []
|
||||||
@ -303,6 +318,16 @@ background:
|
|||||||
tolerations: []
|
tolerations: []
|
||||||
|
|
||||||
vespa:
|
vespa:
|
||||||
|
volumeClaimTemplates:
|
||||||
|
- metadata:
|
||||||
|
name: vespa-storage
|
||||||
|
spec:
|
||||||
|
accessModes:
|
||||||
|
- ReadWriteOnce
|
||||||
|
storageClassName: ""
|
||||||
|
resources:
|
||||||
|
requests:
|
||||||
|
storage: 1Gi
|
||||||
enabled: true
|
enabled: true
|
||||||
replicaCount: 1
|
replicaCount: 1
|
||||||
image:
|
image:
|
||||||
@ -377,19 +402,11 @@ redis:
|
|||||||
# # hosts:
|
# # hosts:
|
||||||
# # - chart-example.local
|
# # - chart-example.local
|
||||||
|
|
||||||
persistence:
|
|
||||||
vespa:
|
|
||||||
enabled: true
|
|
||||||
existingClaim: ""
|
|
||||||
storageClassName: ""
|
|
||||||
accessModes:
|
|
||||||
- ReadWriteOnce
|
|
||||||
size: 5Gi
|
|
||||||
|
|
||||||
auth:
|
auth:
|
||||||
# for storing smtp, oauth, slack, and other secrets
|
# existingSecret (e.g. onyx-secrets) is used for storing smtp, oauth, slack, and other secrets
|
||||||
# keys are lowercased version of env vars (e.g. SMTP_USER -> smtp_user)
|
# keys are lowercased version of env vars (e.g. SMTP_USER -> smtp_user)
|
||||||
existingSecret: "" # onyx-secrets
|
existingSecret: ""
|
||||||
# optionally override the secret keys to reference in the secret
|
# optionally override the secret keys to reference in the secret
|
||||||
# this is used to populate the env vars in individual deployments
|
# this is used to populate the env vars in individual deployments
|
||||||
# the values here reference the keys in secrets below
|
# the values here reference the keys in secrets below
|
||||||
@ -413,14 +430,22 @@ auth:
|
|||||||
redis_password: "password"
|
redis_password: "password"
|
||||||
|
|
||||||
configMap:
|
configMap:
|
||||||
AUTH_TYPE: "disabled" # Change this for production uses unless Onyx is only accessible behind VPN
|
# Change this for production use unless Onyx is only accessible behind a VPN
|
||||||
SESSION_EXPIRE_TIME_SECONDS: "86400" # 1 Day Default
|
AUTH_TYPE: "disabled"
|
||||||
VALID_EMAIL_DOMAINS: "" # Can be something like onyx.app, as an extra double-check
|
# 1 Day Default
|
||||||
SMTP_SERVER: "" # For sending verification emails, if unspecified then defaults to 'smtp.gmail.com'
|
SESSION_EXPIRE_TIME_SECONDS: "86400"
|
||||||
SMTP_PORT: "" # For sending verification emails, if unspecified then defaults to '587'
|
# Can be something like onyx.app, as an extra double-check
|
||||||
SMTP_USER: "" # 'your-email@company.com'
|
VALID_EMAIL_DOMAINS: ""
|
||||||
# SMTP_PASS: "" # 'your-gmail-password'
|
# For sending verification emails, if unspecified then defaults to 'smtp.gmail.com'
|
||||||
EMAIL_FROM: "" # 'your-email@company.com' SMTP_USER missing used instead
|
SMTP_SERVER: ""
|
||||||
|
# For sending verification emails, if unspecified then defaults to '587'
|
||||||
|
SMTP_PORT: ""
|
||||||
|
# 'your-email@company.com'
|
||||||
|
SMTP_USER: ""
|
||||||
|
# 'your-gmail-password'
|
||||||
|
# SMTP_PASS: ""
|
||||||
|
# 'your-email@company.com'; if missing, SMTP_USER is used instead
|
||||||
|
EMAIL_FROM: ""
|
||||||
# Gen AI Settings
|
# Gen AI Settings
|
||||||
GEN_AI_MAX_TOKENS: ""
|
GEN_AI_MAX_TOKENS: ""
|
||||||
QA_TIMEOUT: "60"
|
QA_TIMEOUT: "60"
|
||||||
@ -462,7 +487,7 @@ configMap:
|
|||||||
DANSWER_BOT_DISABLE_DOCS_ONLY_ANSWER: ""
|
DANSWER_BOT_DISABLE_DOCS_ONLY_ANSWER: ""
|
||||||
DANSWER_BOT_DISPLAY_ERROR_MSGS: ""
|
DANSWER_BOT_DISPLAY_ERROR_MSGS: ""
|
||||||
DANSWER_BOT_RESPOND_EVERY_CHANNEL: ""
|
DANSWER_BOT_RESPOND_EVERY_CHANNEL: ""
|
||||||
DANSWER_BOT_DISABLE_COT: "" # Currently unused
|
DANSWER_BOT_DISABLE_COT: ""
|
||||||
NOTIFY_SLACKBOT_NO_ANSWER: ""
|
NOTIFY_SLACKBOT_NO_ANSWER: ""
|
||||||
# Logging
|
# Logging
|
||||||
# Optional Telemetry, please keep it on (nothing sensitive is collected)? <3
|
# Optional Telemetry, please keep it on (nothing sensitive is collected)? <3
|
||||||
@ -473,7 +498,8 @@ configMap:
|
|||||||
LOG_DANSWER_MODEL_INTERACTIONS: ""
|
LOG_DANSWER_MODEL_INTERACTIONS: ""
|
||||||
LOG_VESPA_TIMING_INFORMATION: ""
|
LOG_VESPA_TIMING_INFORMATION: ""
|
||||||
# Shared or Non-backend Related
|
# Shared or Non-backend Related
|
||||||
WEB_DOMAIN: "http://localhost:3000" # for web server and api server
|
WEB_DOMAIN: "http://localhost:3000"
|
||||||
DOMAIN: "localhost" # for nginx
|
# DOMAIN used by nginx
|
||||||
|
DOMAIN: "localhost"
|
||||||
# Chat Configs
|
# Chat Configs
|
||||||
HARD_DELETE_CHATS: ""
|
HARD_DELETE_CHATS: ""
|
||||||
|
Loading…
x
Reference in New Issue
Block a user