From cd09206a901a4db7a839ccf709d98bdb72f2fbb6 Mon Sep 17 00:00:00 2001 From: Julia Kroll <135150417+jkroll-deepgram@users.noreply.github.com> Date: Thu, 24 Oct 2024 15:37:13 -0500 Subject: [PATCH] October 2024 release (241024) (#47) --- charts/deepgram-self-hosted/CHANGELOG.md | 10 +++++++++- charts/deepgram-self-hosted/Chart.yaml | 4 ++-- charts/deepgram-self-hosted/README.md | 8 ++++---- .../deepgram-self-hosted/templates/api/api.config.yaml | 1 + charts/deepgram-self-hosted/values.yaml | 6 +++--- common/license_proxy_deploy/api.toml | 2 ++ common/standard_deploy/api.toml | 2 ++ docker/docker-compose.license-proxy.yml | 6 +++--- docker/docker-compose.standard.yml | 4 ++-- podman/podman-compose.license-proxy.yml | 6 +++--- podman/podman-compose.standard.yml | 4 ++-- 11 files changed, 33 insertions(+), 20 deletions(-) diff --git a/charts/deepgram-self-hosted/CHANGELOG.md b/charts/deepgram-self-hosted/CHANGELOG.md index 684f19b..015ac37 100644 --- a/charts/deepgram-self-hosted/CHANGELOG.md +++ b/charts/deepgram-self-hosted/CHANGELOG.md @@ -6,6 +6,13 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/), ## [Unreleased] +## [0.7.0] - 2024-10-24 + +### Added + +- Updated default container tags to October 2024 release. Refer to the [main Deepgram changelog](https://deepgram.com/changelog/deepgram-self-hosted-october-2024-release-241024) for additional details. Highlights include: + - Adds new [streaming websocket TTS](https://deepgram.com/changelog/websocket-text-to-speech-api)! This is a software feature, so no new TTS models are required. + ### Changed - AWS samples updated to take advantage of new [EKS accelerated AMIs](https://aws.amazon.com/about-aws/whats-new/2024/10/amazon-eks-nvidia-aws-neuron-instance-types-al2023/), which bundle the required NVIDIA driver and toolkit instead of being installed by the NVIDIA GPU operator @@ -124,7 +131,8 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/), - Initial implementation of the Helm chart. -[unreleased]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.6.0...HEAD +[unreleased]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.7.0...HEAD +[0.7.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.6.0...deepgram-self-hosted-0.7.0 [0.6.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.5.0...deepgram-self-hosted-0.6.0 [0.5.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.4.0...deepgram-self-hosted-0.5.0 [0.4.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.3.0...deepgram-self-hosted-0.4.0 diff --git a/charts/deepgram-self-hosted/Chart.yaml b/charts/deepgram-self-hosted/Chart.yaml index e14218f..7290155 100644 --- a/charts/deepgram-self-hosted/Chart.yaml +++ b/charts/deepgram-self-hosted/Chart.yaml @@ -1,8 +1,8 @@ apiVersion: v2 name: deepgram-self-hosted type: application -version: 0.6.0 -appVersion: "release-240927" +version: 0.7.0 +appVersion: "release-241024" description: A Helm chart for running Deepgram services in a self-hosted environment home: "https://developers.deepgram.com/docs/self-hosted-introduction" sources: ["https://github.com/deepgram/self-hosted-resources"] diff --git a/charts/deepgram-self-hosted/README.md b/charts/deepgram-self-hosted/README.md index d04c681..5a5e2e1 100644 --- a/charts/deepgram-self-hosted/README.md +++ b/charts/deepgram-self-hosted/README.md @@ -1,6 +1,6 @@ # deepgram-self-hosted -![Version: 0.6.0](https://img.shields.io/badge/Version-0.6.0-informational?style=flat-square) ![Type: application](https://img.shields.io/badge/Type-application-informational?style=flat-square) ![AppVersion: release-240927](https://img.shields.io/badge/AppVersion-release--240927-informational?style=flat-square) [![Artifact Hub](https://img.shields.io/endpoint?url=https://artifacthub.io/badge/repository/deepgram-self-hosted)](https://artifacthub.io/packages/search?repo=deepgram-self-hosted) +![Version: 0.7.0](https://img.shields.io/badge/Version-0.7.0-informational?style=flat-square) ![Type: application](https://img.shields.io/badge/Type-application-informational?style=flat-square) ![AppVersion: release-241024](https://img.shields.io/badge/AppVersion-release--241024-informational?style=flat-square) [![Artifact Hub](https://img.shields.io/endpoint?url=https://artifacthub.io/badge/repository/deepgram-self-hosted)](https://artifacthub.io/packages/search?repo=deepgram-self-hosted) A Helm chart for running Deepgram services in a self-hosted environment @@ -192,7 +192,7 @@ If you encounter issues while deploying or using Deepgram, consider the followin | api.features.entityRedaction | bool | `false` | Enables entity-based redaction on pre-recorded audio *if* a valid entity detection model is available. *WARNING*: Beta functionality. | | api.image.path | string | `"quay.io/deepgram/self-hosted-api"` | path configures the image path to use for creating API containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | | api.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram API image | -| api.image.tag | string | `"release-240927"` | tag defines which Deepgram release to use for API containers | +| api.image.tag | string | `"release-241024"` | tag defines which Deepgram release to use for API containers | | api.livenessProbe | object | `` | Liveness probe customization for API pods. | | api.namePrefix | string | `"deepgram-api"` | namePrefix is the prefix to apply to the name of all K8s objects associated with the Deepgram API containers. | | api.readinessProbe | object | `` | Readiness probe customization for API pods. | @@ -231,7 +231,7 @@ If you encounter issues while deploying or using Deepgram, consider the followin | engine.halfPrecision.state | string | `"auto"` | Engine will automatically enable half precision operations if your GPU supports them. You can explicitly enable or disable this behavior with the state parameter which supports `"enable"`, `"disabled"`, and `"auto"`. | | engine.image.path | string | `"quay.io/deepgram/self-hosted-engine"` | path configures the image path to use for creating Engine containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | | engine.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram Engine image | -| engine.image.tag | string | `"release-240927"` | tag defines which Deepgram release to use for Engine containers | +| engine.image.tag | string | `"release-241024"` | tag defines which Deepgram release to use for Engine containers | | engine.livenessProbe | object | `` | Liveness probe customization for Engine pods. | | engine.metricsServer | object | `` | metricsServer exposes an endpoint on each Engine container for reporting inference-specific system metrics. See https://developers.deepgram.com/docs/metrics-guide#deepgram-engine for more details. | | engine.metricsServer.host | string | `"0.0.0.0"` | host is the IP address to listen on for metrics requests. You will want to listen on all interfaces to interact with other pods in the cluster. | @@ -289,7 +289,7 @@ If you encounter issues while deploying or using Deepgram, consider the followin | licenseProxy.enabled | bool | `false` | The License Proxy is optional, but highly recommended to be deployed in production to enable highly available environments. | | licenseProxy.image.path | string | `"quay.io/deepgram/self-hosted-license-proxy"` | path configures the image path to use for creating License Proxy containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | | licenseProxy.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram License Proxy image | -| licenseProxy.image.tag | string | `"release-240927"` | tag defines which Deepgram release to use for License Proxy containers | +| licenseProxy.image.tag | string | `"release-241024"` | tag defines which Deepgram release to use for License Proxy containers | | licenseProxy.keepUpstreamServerAsBackup | bool | `true` | Even with a License Proxy deployed, API and Engine pods can be configured to keep the upstream `license.deepgram.com` license server as a fallback licensing option if the License Proxy is unavailable. Disable this option if you are restricting API/Engine Pod network access for security reasons, and only the License Proxy should send egress traffic to the upstream license server. | | licenseProxy.livenessProbe | object | `` | Liveness probe customization for Proxy pods. | | licenseProxy.namePrefix | string | `"deepgram-license-proxy"` | namePrefix is the prefix to apply to the name of all K8s objects associated with the Deepgram License Proxy containers. | diff --git a/charts/deepgram-self-hosted/templates/api/api.config.yaml b/charts/deepgram-self-hosted/templates/api/api.config.yaml index d08b06a..d555e57 100644 --- a/charts/deepgram-self-hosted/templates/api/api.config.yaml +++ b/charts/deepgram-self-hosted/templates/api/api.config.yaml @@ -47,6 +47,7 @@ data: summarization = true entity_detection = {{ .Values.api.features.entityDetection }} entity_redaction = {{ .Values.api.features.entityRedaction }} + speak_streaming = true {{- if .Values.api.features.diskBufferPath }} disk_buffer_path = "{{ .Values.api.features.diskBufferPath }}" diff --git a/charts/deepgram-self-hosted/values.yaml b/charts/deepgram-self-hosted/values.yaml index 029591d..db7b19d 100644 --- a/charts/deepgram-self-hosted/values.yaml +++ b/charts/deepgram-self-hosted/values.yaml @@ -112,7 +112,7 @@ api: # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram API image pullPolicy: IfNotPresent # -- tag defines which Deepgram release to use for API containers - tag: release-240927 + tag: release-241024 # -- Additional labels to add to API resources additionalLabels: {} @@ -278,7 +278,7 @@ engine: # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram Engine image pullPolicy: IfNotPresent # -- tag defines which Deepgram release to use for Engine containers - tag: release-240927 + tag: release-241024 # -- Additional labels to add to Engine resources additionalLabels: {} @@ -529,7 +529,7 @@ licenseProxy: # Deepgram images into a private container registry. path: quay.io/deepgram/self-hosted-license-proxy # -- tag defines which Deepgram release to use for License Proxy containers - tag: release-240927 + tag: release-241024 # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram # License Proxy image pullPolicy: IfNotPresent diff --git a/common/license_proxy_deploy/api.toml b/common/license_proxy_deploy/api.toml index c1990df..3eecd83 100644 --- a/common/license_proxy_deploy/api.toml +++ b/common/license_proxy_deploy/api.toml @@ -84,6 +84,8 @@ entity_redaction = false # or true ### the queue (and response time) will grow indefinitely. # disk_buffer_path = "/path/to/disk/buffer/directory" +### Enables streaming TTS *if* a valid Aura TTS model is available +speak_streaming = true # or false ### Configure the backend pool of speech engines (generically referred to as ### "drivers" here). The API will load-balance among drivers in the standard diff --git a/common/standard_deploy/api.toml b/common/standard_deploy/api.toml index 70e10e8..e016235 100644 --- a/common/standard_deploy/api.toml +++ b/common/standard_deploy/api.toml @@ -82,6 +82,8 @@ entity_redaction = false # or true ### the queue (and response time) will grow indefinitely. # disk_buffer_path = "/path/to/disk/buffer/directory" +### Enables streaming TTS *if* a valid Aura TTS model is available +speak_streaming = true # or false ### Configure the backend pool of speech engines (generically referred to as ### "drivers" here). The API will load-balance among drivers in the standard diff --git a/docker/docker-compose.license-proxy.yml b/docker/docker-compose.license-proxy.yml index 883541b..667c859 100644 --- a/docker/docker-compose.license-proxy.yml +++ b/docker/docker-compose.license-proxy.yml @@ -9,7 +9,7 @@ x-env: &env services: # The speech API service. api: - image: quay.io/deepgram/self-hosted-api:release-240927 + image: quay.io/deepgram/self-hosted-api:release-241024 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -43,7 +43,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/self-hosted-engine:release-240927 + image: quay.io/deepgram/self-hosted-engine:release-241024 # Utilize a GPU, if available. runtime: nvidia @@ -83,7 +83,7 @@ services: # The service to validate your Deepgram license license-proxy: - image: quay.io/deepgram/self-hosted-license-proxy:release-240927 + image: quay.io/deepgram/self-hosted-license-proxy:release-241024 # Here we expose the License Proxy status port to the host machine. The container port # (right-hand side) must match the port that the License Proxy service is listening diff --git a/docker/docker-compose.standard.yml b/docker/docker-compose.standard.yml index 59611a3..b572b55 100644 --- a/docker/docker-compose.standard.yml +++ b/docker/docker-compose.standard.yml @@ -9,7 +9,7 @@ x-env: &env services: # The speech API service. api: - image: quay.io/deepgram/self-hosted-api:release-240927 + image: quay.io/deepgram/self-hosted-api:release-241024 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -39,7 +39,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/self-hosted-engine:release-240927 + image: quay.io/deepgram/self-hosted-engine:release-241024 # Utilize a GPU, if available. runtime: nvidia diff --git a/podman/podman-compose.license-proxy.yml b/podman/podman-compose.license-proxy.yml index 9b1aa40..d346e95 100644 --- a/podman/podman-compose.license-proxy.yml +++ b/podman/podman-compose.license-proxy.yml @@ -3,7 +3,7 @@ services: # The speech API service. api: - image: quay.io/deepgram/self-hosted-api:release-240927 + image: quay.io/deepgram/self-hosted-api:release-241024 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -40,7 +40,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/self-hosted-engine:release-240927 + image: quay.io/deepgram/self-hosted-engine:release-241024 # Utilize a GPU, if available. devices: @@ -84,7 +84,7 @@ services: # The service to validate your Deepgram license license-proxy: - image: quay.io/deepgram/self-hosted-license-proxy:release-240927 + image: quay.io/deepgram/self-hosted-license-proxy:release-241024 # Here we expose the License Proxy status port to the host machine. The container port # (right-hand side) must match the port that the License Proxy service is listening diff --git a/podman/podman-compose.standard.yml b/podman/podman-compose.standard.yml index 8df4546..e005ef8 100644 --- a/podman/podman-compose.standard.yml +++ b/podman/podman-compose.standard.yml @@ -3,7 +3,7 @@ services: # The speech API service. api: - image: quay.io/deepgram/self-hosted-api:release-240927 + image: quay.io/deepgram/self-hosted-api:release-241024 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -36,7 +36,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/self-hosted-engine:release-240927 + image: quay.io/deepgram/self-hosted-engine:release-241024 # Utilize a GPU, if available. devices: