From cd09206a901a4db7a839ccf709d98bdb72f2fbb6 Mon Sep 17 00:00:00 2001
From: Julia Kroll <135150417+jkroll-deepgram@users.noreply.github.com>
Date: Thu, 24 Oct 2024 15:37:13 -0500
Subject: [PATCH] October 2024 release (241024) (#47)

---
 charts/deepgram-self-hosted/CHANGELOG.md               | 10 +++++++++-
 charts/deepgram-self-hosted/Chart.yaml                 |  4 ++--
 charts/deepgram-self-hosted/README.md                  |  8 ++++----
 .../deepgram-self-hosted/templates/api/api.config.yaml |  1 +
 charts/deepgram-self-hosted/values.yaml                |  6 +++---
 common/license_proxy_deploy/api.toml                   |  2 ++
 common/standard_deploy/api.toml                        |  2 ++
 docker/docker-compose.license-proxy.yml                |  6 +++---
 docker/docker-compose.standard.yml                     |  4 ++--
 podman/podman-compose.license-proxy.yml                |  6 +++---
 podman/podman-compose.standard.yml                     |  4 ++--
 11 files changed, 33 insertions(+), 20 deletions(-)

diff --git a/charts/deepgram-self-hosted/CHANGELOG.md b/charts/deepgram-self-hosted/CHANGELOG.md
index 684f19b..015ac37 100644
--- a/charts/deepgram-self-hosted/CHANGELOG.md
+++ b/charts/deepgram-self-hosted/CHANGELOG.md
@@ -6,6 +6,13 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/),
 
 ## [Unreleased]
 
+## [0.7.0] - 2024-10-24
+
+### Added
+
+- Updated default container tags to the October 2024 release. Refer to the [main Deepgram changelog](https://deepgram.com/changelog/deepgram-self-hosted-october-2024-release-241024) for additional details. Highlights include:
+  - Adds new [streaming WebSocket TTS](https://deepgram.com/changelog/websocket-text-to-speech-api) support. This is a software feature, so no new TTS models are required.
+
 ### Changed
 
 - AWS samples updated to take advantage of new [EKS accelerated AMIs](https://aws.amazon.com/about-aws/whats-new/2024/10/amazon-eks-nvidia-aws-neuron-instance-types-al2023/), which bundle the required NVIDIA driver and toolkit instead of being installed by the NVIDIA GPU operator 
@@ -124,7 +131,8 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/),
 - Initial implementation of the Helm chart.
 
 
-[unreleased]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.6.0...HEAD
+[unreleased]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.7.0...HEAD
+[0.7.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.6.0...deepgram-self-hosted-0.7.0
 [0.6.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.5.0...deepgram-self-hosted-0.6.0
 [0.5.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.4.0...deepgram-self-hosted-0.5.0
 [0.4.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.3.0...deepgram-self-hosted-0.4.0
diff --git a/charts/deepgram-self-hosted/Chart.yaml b/charts/deepgram-self-hosted/Chart.yaml
index e14218f..7290155 100644
--- a/charts/deepgram-self-hosted/Chart.yaml
+++ b/charts/deepgram-self-hosted/Chart.yaml
@@ -1,8 +1,8 @@
 apiVersion: v2
 name: deepgram-self-hosted
 type: application
-version: 0.6.0
-appVersion: "release-240927"
+version: 0.7.0
+appVersion: "release-241024"
 description: A Helm chart for running Deepgram services in a self-hosted environment
 home: "https://developers.deepgram.com/docs/self-hosted-introduction"
 sources: ["https://github.com/deepgram/self-hosted-resources"]
diff --git a/charts/deepgram-self-hosted/README.md b/charts/deepgram-self-hosted/README.md
index d04c681..5a5e2e1 100644
--- a/charts/deepgram-self-hosted/README.md
+++ b/charts/deepgram-self-hosted/README.md
@@ -1,6 +1,6 @@
 # deepgram-self-hosted
 
-![Version: 0.6.0](https://img.shields.io/badge/Version-0.6.0-informational?style=flat-square) ![Type: application](https://img.shields.io/badge/Type-application-informational?style=flat-square) ![AppVersion: release-240927](https://img.shields.io/badge/AppVersion-release--240927-informational?style=flat-square) [![Artifact Hub](https://img.shields.io/endpoint?url=https://artifacthub.io/badge/repository/deepgram-self-hosted)](https://artifacthub.io/packages/search?repo=deepgram-self-hosted)
+![Version: 0.7.0](https://img.shields.io/badge/Version-0.7.0-informational?style=flat-square) ![Type: application](https://img.shields.io/badge/Type-application-informational?style=flat-square) ![AppVersion: release-241024](https://img.shields.io/badge/AppVersion-release--241024-informational?style=flat-square) [![Artifact Hub](https://img.shields.io/endpoint?url=https://artifacthub.io/badge/repository/deepgram-self-hosted)](https://artifacthub.io/packages/search?repo=deepgram-self-hosted)
 
 A Helm chart for running Deepgram services in a self-hosted environment
 
@@ -192,7 +192,7 @@ If you encounter issues while deploying or using Deepgram, consider the followin
 | api.features.entityRedaction | bool | `false` | Enables entity-based redaction on pre-recorded audio *if* a valid entity detection model is available. *WARNING*: Beta functionality. |
 | api.image.path | string | `"quay.io/deepgram/self-hosted-api"` | path configures the image path to use for creating API containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. |
 | api.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram API image |
-| api.image.tag | string | `"release-240927"` | tag defines which Deepgram release to use for API containers |
+| api.image.tag | string | `"release-241024"` | tag defines which Deepgram release to use for API containers |
 | api.livenessProbe | object | `` | Liveness probe customization for API pods. |
 | api.namePrefix | string | `"deepgram-api"` | namePrefix is the prefix to apply to the name of all K8s objects associated with the Deepgram API containers. |
 | api.readinessProbe | object | `` | Readiness probe customization for API pods. |
@@ -231,7 +231,7 @@ If you encounter issues while deploying or using Deepgram, consider the followin
 | engine.halfPrecision.state | string | `"auto"` | Engine will automatically enable half precision operations if your GPU supports them. You can explicitly enable or disable this behavior with the state parameter which supports `"enable"`, `"disabled"`, and `"auto"`. |
 | engine.image.path | string | `"quay.io/deepgram/self-hosted-engine"` | path configures the image path to use for creating Engine containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. |
 | engine.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram Engine image |
-| engine.image.tag | string | `"release-240927"` | tag defines which Deepgram release to use for Engine containers |
+| engine.image.tag | string | `"release-241024"` | tag defines which Deepgram release to use for Engine containers |
 | engine.livenessProbe | object | `` | Liveness probe customization for Engine pods. |
 | engine.metricsServer | object | `` | metricsServer exposes an endpoint on each Engine container for reporting inference-specific system metrics. See https://developers.deepgram.com/docs/metrics-guide#deepgram-engine for more details. |
 | engine.metricsServer.host | string | `"0.0.0.0"` | host is the IP address to listen on for metrics requests. You will want to listen on all interfaces to interact with other pods in the cluster. |
@@ -289,7 +289,7 @@ If you encounter issues while deploying or using Deepgram, consider the followin
 | licenseProxy.enabled | bool | `false` | The License Proxy is optional, but highly recommended to be deployed in production to enable highly available environments. |
 | licenseProxy.image.path | string | `"quay.io/deepgram/self-hosted-license-proxy"` | path configures the image path to use for creating License Proxy containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. |
 | licenseProxy.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram License Proxy image |
-| licenseProxy.image.tag | string | `"release-240927"` | tag defines which Deepgram release to use for License Proxy containers |
+| licenseProxy.image.tag | string | `"release-241024"` | tag defines which Deepgram release to use for License Proxy containers |
 | licenseProxy.keepUpstreamServerAsBackup | bool | `true` | Even with a License Proxy deployed, API and Engine pods can be configured to keep the upstream `license.deepgram.com` license server as a fallback licensing option if the License Proxy is unavailable. Disable this option if you are restricting API/Engine Pod network access for security reasons, and only the License Proxy should send egress traffic to the upstream license server. |
 | licenseProxy.livenessProbe | object | `` | Liveness probe customization for Proxy pods. |
 | licenseProxy.namePrefix | string | `"deepgram-license-proxy"` | namePrefix is the prefix to apply to the name of all K8s objects associated with the Deepgram License Proxy containers. |
diff --git a/charts/deepgram-self-hosted/templates/api/api.config.yaml b/charts/deepgram-self-hosted/templates/api/api.config.yaml
index d08b06a..d555e57 100644
--- a/charts/deepgram-self-hosted/templates/api/api.config.yaml
+++ b/charts/deepgram-self-hosted/templates/api/api.config.yaml
@@ -47,6 +47,7 @@ data:
       summarization = true
       entity_detection = {{ .Values.api.features.entityDetection }}
       entity_redaction = {{ .Values.api.features.entityRedaction }}
+      speak_streaming = true
 
       {{- if .Values.api.features.diskBufferPath }}
       disk_buffer_path = "{{ .Values.api.features.diskBufferPath }}"
diff --git a/charts/deepgram-self-hosted/values.yaml b/charts/deepgram-self-hosted/values.yaml
index 029591d..db7b19d 100644
--- a/charts/deepgram-self-hosted/values.yaml
+++ b/charts/deepgram-self-hosted/values.yaml
@@ -112,7 +112,7 @@ api:
     # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram API image
     pullPolicy: IfNotPresent
     # -- tag defines which Deepgram release to use for API containers
-    tag: release-240927
+    tag: release-241024
 
   # -- Additional labels to add to API resources
   additionalLabels: {}
@@ -278,7 +278,7 @@ engine:
     # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram Engine image
     pullPolicy: IfNotPresent
     # -- tag defines which Deepgram release to use for Engine containers
-    tag: release-240927
+    tag: release-241024
 
   # -- Additional labels to add to Engine resources
   additionalLabels: {}
@@ -529,7 +529,7 @@ licenseProxy:
     # Deepgram images into a private container registry.
     path: quay.io/deepgram/self-hosted-license-proxy
     # -- tag defines which Deepgram release to use for License Proxy containers
-    tag: release-240927
+    tag: release-241024
     # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram
     # License Proxy image
     pullPolicy: IfNotPresent
diff --git a/common/license_proxy_deploy/api.toml b/common/license_proxy_deploy/api.toml
index c1990df..3eecd83 100644
--- a/common/license_proxy_deploy/api.toml
+++ b/common/license_proxy_deploy/api.toml
@@ -84,6 +84,8 @@ entity_redaction = false # or true
 ### the queue (and response time) will grow indefinitely.
 # disk_buffer_path = "/path/to/disk/buffer/directory"
 
+### Enables streaming text-to-speech (TTS) *if* a valid Aura TTS model is available.
+speak_streaming = true # or false
 
 ### Configure the backend pool of speech engines (generically referred to as
 ### "drivers" here). The API will load-balance among drivers in the standard
diff --git a/common/standard_deploy/api.toml b/common/standard_deploy/api.toml
index 70e10e8..e016235 100644
--- a/common/standard_deploy/api.toml
+++ b/common/standard_deploy/api.toml
@@ -82,6 +82,8 @@ entity_redaction = false # or true
 ### the queue (and response time) will grow indefinitely.
 # disk_buffer_path = "/path/to/disk/buffer/directory"
 
+### Enables streaming text-to-speech (TTS) *if* a valid Aura TTS model is available.
+speak_streaming = true # or false
 
 ### Configure the backend pool of speech engines (generically referred to as
 ### "drivers" here). The API will load-balance among drivers in the standard
diff --git a/docker/docker-compose.license-proxy.yml b/docker/docker-compose.license-proxy.yml
index 883541b..667c859 100644
--- a/docker/docker-compose.license-proxy.yml
+++ b/docker/docker-compose.license-proxy.yml
@@ -9,7 +9,7 @@ x-env: &env
 services:
   # The speech API service.
   api:
-    image: quay.io/deepgram/self-hosted-api:release-240927
+    image: quay.io/deepgram/self-hosted-api:release-241024
 
     # Here we expose the API port to the host machine. The container port
     # (right-hand side) must match the port that the API service is listening
@@ -43,7 +43,7 @@ services:
 
   # The speech engine service.
   engine:
-    image: quay.io/deepgram/self-hosted-engine:release-240927
+    image: quay.io/deepgram/self-hosted-engine:release-241024
 
     # Utilize a GPU, if available.
     runtime: nvidia
@@ -83,7 +83,7 @@ services:
 
   # The service to validate your Deepgram license
   license-proxy:
-    image: quay.io/deepgram/self-hosted-license-proxy:release-240927
+    image: quay.io/deepgram/self-hosted-license-proxy:release-241024
 
     # Here we expose the License Proxy status port to the host machine. The container port
     # (right-hand side) must match the port that the License Proxy service is listening
diff --git a/docker/docker-compose.standard.yml b/docker/docker-compose.standard.yml
index 59611a3..b572b55 100644
--- a/docker/docker-compose.standard.yml
+++ b/docker/docker-compose.standard.yml
@@ -9,7 +9,7 @@ x-env: &env
 services:
   # The speech API service.
   api:
-    image: quay.io/deepgram/self-hosted-api:release-240927
+    image: quay.io/deepgram/self-hosted-api:release-241024
 
     # Here we expose the API port to the host machine. The container port
     # (right-hand side) must match the port that the API service is listening
@@ -39,7 +39,7 @@ services:
 
   # The speech engine service.
   engine:
-    image: quay.io/deepgram/self-hosted-engine:release-240927
+    image: quay.io/deepgram/self-hosted-engine:release-241024
 
     # Utilize a GPU, if available.
     runtime: nvidia
diff --git a/podman/podman-compose.license-proxy.yml b/podman/podman-compose.license-proxy.yml
index 9b1aa40..d346e95 100644
--- a/podman/podman-compose.license-proxy.yml
+++ b/podman/podman-compose.license-proxy.yml
@@ -3,7 +3,7 @@
 services:
   # The speech API service.
   api:
-    image: quay.io/deepgram/self-hosted-api:release-240927
+    image: quay.io/deepgram/self-hosted-api:release-241024
 
     # Here we expose the API port to the host machine. The container port
     # (right-hand side) must match the port that the API service is listening
@@ -40,7 +40,7 @@ services:
 
   # The speech engine service.
   engine:
-    image: quay.io/deepgram/self-hosted-engine:release-240927
+    image: quay.io/deepgram/self-hosted-engine:release-241024
 
     # Utilize a GPU, if available.
     devices:
@@ -84,7 +84,7 @@ services:
 
   # The service to validate your Deepgram license
   license-proxy:
-    image: quay.io/deepgram/self-hosted-license-proxy:release-240927
+    image: quay.io/deepgram/self-hosted-license-proxy:release-241024
 
     # Here we expose the License Proxy status port to the host machine. The container port
     # (right-hand side) must match the port that the License Proxy service is listening
diff --git a/podman/podman-compose.standard.yml b/podman/podman-compose.standard.yml
index 8df4546..e005ef8 100644
--- a/podman/podman-compose.standard.yml
+++ b/podman/podman-compose.standard.yml
@@ -3,7 +3,7 @@
 services:
   # The speech API service.
   api:
-    image: quay.io/deepgram/self-hosted-api:release-240927
+    image: quay.io/deepgram/self-hosted-api:release-241024
 
     # Here we expose the API port to the host machine. The container port
     # (right-hand side) must match the port that the API service is listening
@@ -36,7 +36,7 @@ services:
 
   # The speech engine service.
   engine:
-    image: quay.io/deepgram/self-hosted-engine:release-240927
+    image: quay.io/deepgram/self-hosted-engine:release-241024
 
     # Utilize a GPU, if available.
     devices: