From 026652d82741bd15b90e745ac37de8d80a908982 Mon Sep 17 00:00:00 2001
From: Yuhong Sun <yuhongsun96@gmail.com>
Date: Sat, 1 Jun 2024 17:29:58 -0700
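Subject: [PATCH] Helm tuning (#1553)

- backend: set TRANSFORMERS_NO_ADVISORY_WARNINGS=1 in search_nlp_models.py.
- helm: default the api and background `resources` to {} and keep suggested
  values (requests 1 CPU / 1Gi, limits 2 CPU / 2Gi) as commented-out examples.
- kubernetes: raise the postgres and vespa storage requests from 1Gi to 5Gi.
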
---
 backend/danswer/search/search_nlp_models.py   |  1 +
 deployment/helm/values.yaml                   | 28 +++++++++----------
 .../postgres-service-deployment.yaml          |  2 +-
 .../kubernetes/vespa-service-deployment.yaml  |  2 +-
 4 files changed, 17 insertions(+), 16 deletions(-)

diff --git a/backend/danswer/search/search_nlp_models.py b/backend/danswer/search/search_nlp_models.py
index 5243a29c0..761d9aa79 100644
--- a/backend/danswer/search/search_nlp_models.py
+++ b/backend/danswer/search/search_nlp_models.py
@@ -24,6 +24,7 @@ transformer_logging.set_verbosity_error()
 
 os.environ["TOKENIZERS_PARALLELISM"] = "false"
 os.environ["HF_HUB_DISABLE_TELEMETRY"] = "1"
+os.environ["TRANSFORMERS_NO_ADVISORY_WARNINGS"] = "1"
 
 logger = setup_logger()
 
diff --git a/deployment/helm/values.yaml b/deployment/helm/values.yaml
index 68a477835..19fa2f6e3 100644
--- a/deployment/helm/values.yaml
+++ b/deployment/helm/values.yaml
@@ -194,17 +194,17 @@ api:
     type: ClusterIP
     port: 8080
 
-  resources:
+  resources: {}
   # We usually recommend not to specify default resources and to leave this as a conscious
   # choice for the user. This also increases chances charts run on environments with little
   # resources, such as Minikube. If you do want to specify resources, uncomment the following
   # lines, adjust them as necessary, and remove the curly braces after 'resources:'.
-    requests:
-      cpu: 500m
-      memory: 128Mi
-    limits:
-      cpu: 900m
-      memory: 512Mi
+  #  requests:
+  #    cpu: 1000m  # Requests 1 CPU core
+  #    memory: 1Gi  # Requests 1 GiB of memory
+  #  limits:
+  #    cpu: 2000m  # Limits to 2 CPU cores
+  #    memory: 2Gi  # Limits to 2 GiB of memory
 
   autoscaling:
     enabled: false
@@ -254,17 +254,17 @@ background:
     # runAsNonRoot: true
     # runAsUser: 1000
   enableMiniChunk: "true"
-  resources:
+  resources: {}
   # We usually recommend not to specify default resources and to leave this as a conscious
   # choice for the user. This also increases chances charts run on environments with little
   # resources, such as Minikube. If you do want to specify resources, uncomment the following
   # lines, adjust them as necessary, and remove the curly braces after 'resources:'.
-    requests:
-      cpu: 500m
-      memory: 500Mi
-    limits:
-      cpu: 900m
-      memory: 800Mi
+  #  requests:
+  #    cpu: 1000m  # Requests 1 CPU core
+  #    memory: 1Gi  # Requests 1 GiB of memory
+  #  limits:
+  #    cpu: 2000m  # Limits to 2 CPU cores
+  #    memory: 2Gi  # Limits to 2 GiB of memory
 
   autoscaling:
     enabled: false
diff --git a/deployment/kubernetes/postgres-service-deployment.yaml b/deployment/kubernetes/postgres-service-deployment.yaml
index f33efa2ba..17330204c 100644
--- a/deployment/kubernetes/postgres-service-deployment.yaml
+++ b/deployment/kubernetes/postgres-service-deployment.yaml
@@ -54,4 +54,4 @@ spec:
       resources:
         requests:
           # Adjust the storage request size as needed.
-          storage: 1Gi
+          storage: 5Gi
diff --git a/deployment/kubernetes/vespa-service-deployment.yaml b/deployment/kubernetes/vespa-service-deployment.yaml
index 4fa5aa9fa..5016258b7 100644
--- a/deployment/kubernetes/vespa-service-deployment.yaml
+++ b/deployment/kubernetes/vespa-service-deployment.yaml
@@ -60,4 +60,4 @@ spec:
       resources:
         requests:
           # Adjust the storage request size as needed.
-          storage: 1Gi
+          storage: 5Gi