BasedHardware · beastoin · Jun 14, 2025 · Jun 2, 2025 · Jun 14, 2025 · Jun 14, 2025
diff --git a/backend/charts/deepgram-self-hosted/nova-3/dev_omi_values.yaml b/backend/charts/deepgram-self-hosted/nova-3/dev_omi_values.yaml
@@ -53,29 +53,29 @@ scaling:
           batch:
             requestsPerPod: # Discuss a reasonable value with your Deepgram Account Representative
           streaming:
-            requestsPerPod: 
+            requestsPerPod: 30
         textToSpeech:
           batch:
             requestsPerPod: # Discuss a reasonable value with your Deepgram Account Representative
         # Discuss a reasonable value with your Deepgram Account Representative
         # Must also set engine.concurrencyLimit.activeRequests if using request ratio for autoscaling
         requestCapacityRatio:
-        custom:
-        - type: External
-          external:
-            metric:
-              name: engine_avg_gpu_utilization
-            target:
-              type: Value
-              value: 70
+        # custom:
+        # - type: External
+        #   external:
+        #     metric:
+        #       name: engine_avg_gpu_utilization
+        #     target:
+        #       type: Value
+        #       value: 70
       behavior:
         scaleUp:
           stabilizationWindowSeconds: 120  # Wait 2 minutes before scaling up
 
 api:
   image:
     path: us-central1-docker.pkg.dev/based-hardware-dev/deepgram/self-hosted-api
-    tag: release-250505
+    tag: release-250610
   affinity:
     nodeAffinity:
       requiredDuringSchedulingIgnoredDuringExecution:
@@ -108,7 +108,7 @@ api:
 engine:
   image:
     path: us-central1-docker.pkg.dev/based-hardware-dev/deepgram/self-hosted-engine
-    tag: release-250505
+    tag: release-250610
   affinity:
     nodeAffinity:
       requiredDuringSchedulingIgnoredDuringExecution:
@@ -144,7 +144,7 @@ licenseProxy:
   enabled: true
   image:
     path: us-central1-docker.pkg.dev/based-hardware-dev/deepgram/self-hosted-license-proxy
-    tag: release-250505
+    tag: release-250610
   affinity:
     nodeAffinity:
       requiredDuringSchedulingIgnoredDuringExecution:

diff --git a/backend/charts/deepgram-self-hosted/nova-3/prod_omi_values.yaml b/backend/charts/deepgram-self-hosted/nova-3/prod_omi_values.yaml
@@ -45,37 +45,37 @@ scaling:
 
     engine:
       # -- Minimum number of Engine replicas.
-      minReplicas: 5
+      minReplicas: 10
       # -- Maximum number of Engine replicas.
       maxReplicas: 20
       metrics:
         speechToText:
           batch:
             requestsPerPod: # Discuss a reasonable value with your Deepgram Account Representative
           streaming:
-            requestsPerPod: 
+            requestsPerPod: 30
         textToSpeech:
           batch:
             requestsPerPod: # Discuss a reasonable value with your Deepgram Account Representative
         # Discuss a reasonable value with your Deepgram Account Representative
         # Must also set engine.concurrencyLimit.activeRequests if using request ratio for autoscaling
         requestCapacityRatio:
-        custom:
-        - type: External
-          external:
-            metric:
-              name: engine_avg_gpu_utilization
-            target:
-              type: Value
-              value: 60
+        # custom:
+        # - type: External
+        #   external:
+        #     metric:
+        #       name: engine_avg_gpu_utilization
+        #     target:
+        #       type: Value
+        #       value: 60
       behavior:
         scaleUp:
           stabilizationWindowSeconds: 60  # Wait 1 minute before scaling up
 
 api:
   image:
     path: us-central1-docker.pkg.dev/based-hardware/deepgram/self-hosted-api
-    tag: release-250505
+    tag: release-250610
   affinity:
     nodeAffinity:
       requiredDuringSchedulingIgnoredDuringExecution:
@@ -108,7 +108,7 @@ api:
 engine:
   image:
     path: us-central1-docker.pkg.dev/based-hardware/deepgram/self-hosted-engine
-    tag: release-250505
+    tag: release-250610
   affinity:
     nodeAffinity:
       requiredDuringSchedulingIgnoredDuringExecution:
@@ -144,7 +144,7 @@ licenseProxy:
   enabled: true
   image:
     path: us-central1-docker.pkg.dev/based-hardware/deepgram/self-hosted-license-proxy
-    tag: release-250505
+    tag: release-250610
   affinity:
     nodeAffinity:
       requiredDuringSchedulingIgnoredDuringExecution: