From 026652d82741bd15b90e745ac37de8d80a908982 Mon Sep 17 00:00:00 2001 From: Yuhong Sun Date: Sat, 1 Jun 2024 17:29:58 -0700 Subject: [PATCH] Helm tuning (#1553) --- backend/danswer/search/search_nlp_models.py | 1 + deployment/helm/values.yaml | 28 +++++++++---------- .../postgres-service-deployment.yaml | 2 +- .../kubernetes/vespa-service-deployment.yaml | 2 +- 4 files changed, 17 insertions(+), 16 deletions(-) diff --git a/backend/danswer/search/search_nlp_models.py b/backend/danswer/search/search_nlp_models.py index 5243a29c0..761d9aa79 100644 --- a/backend/danswer/search/search_nlp_models.py +++ b/backend/danswer/search/search_nlp_models.py @@ -24,6 +24,7 @@ transformer_logging.set_verbosity_error() os.environ["TOKENIZERS_PARALLELISM"] = "false" os.environ["HF_HUB_DISABLE_TELEMETRY"] = "1" +os.environ["TRANSFORMERS_NO_ADVISORY_WARNINGS"] = "1" logger = setup_logger() diff --git a/deployment/helm/values.yaml b/deployment/helm/values.yaml index 68a477835..19fa2f6e3 100644 --- a/deployment/helm/values.yaml +++ b/deployment/helm/values.yaml @@ -194,17 +194,17 @@ api: type: ClusterIP port: 8080 - resources: + resources: {} # We usually recommend not to specify default resources and to leave this as a conscious # choice for the user. This also increases chances charts run on environments with little # resources, such as Minikube. If you do want to specify resources, uncomment the following # lines, adjust them as necessary, and remove the curly braces after 'resources:'. - requests: - cpu: 500m - memory: 128Mi - limits: - cpu: 900m - memory: 512Mi + # requests: + # cpu: 1000m # Requests 1 CPU core + # memory: 1Gi # Requests 1 GiB of memory + # limits: + # cpu: 2000m # Limits to 2 CPU cores + # memory: 2Gi # Limits to 2 GiB of memory autoscaling: enabled: false @@ -254,17 +254,17 @@ background: # runAsNonRoot: true # runAsUser: 1000 enableMiniChunk: "true" - resources: + resources: {} # We usually recommend not to specify default resources and to leave this as a conscious # choice for the user. This also increases chances charts run on environments with little # resources, such as Minikube. If you do want to specify resources, uncomment the following # lines, adjust them as necessary, and remove the curly braces after 'resources:'. - requests: - cpu: 500m - memory: 500Mi - limits: - cpu: 900m - memory: 800Mi + # requests: + # cpu: 1000m # Requests 1 CPU core + # memory: 1Gi # Requests 1 GiB of memory + # limits: + # cpu: 2000m # Limits to 2 CPU cores + # memory: 2Gi # Limits to 2 GiB of memory autoscaling: enabled: false diff --git a/deployment/kubernetes/postgres-service-deployment.yaml b/deployment/kubernetes/postgres-service-deployment.yaml index f33efa2ba..17330204c 100644 --- a/deployment/kubernetes/postgres-service-deployment.yaml +++ b/deployment/kubernetes/postgres-service-deployment.yaml @@ -54,4 +54,4 @@ spec: resources: requests: # Adjust the storage request size as needed. - storage: 1Gi + storage: 5Gi diff --git a/deployment/kubernetes/vespa-service-deployment.yaml b/deployment/kubernetes/vespa-service-deployment.yaml index 4fa5aa9fa..5016258b7 100644 --- a/deployment/kubernetes/vespa-service-deployment.yaml +++ b/deployment/kubernetes/vespa-service-deployment.yaml @@ -60,4 +60,4 @@ spec: resources: requests: # Adjust the storage request size as needed. - storage: 1Gi + storage: 5Gi