From 721a0dbc7c5af89b7f8e383df32a09d8b96daa04 Mon Sep 17 00:00:00 2001 From: Julia Kroll <135150417+jkroll-deepgram@users.noreply.github.com> Date: Fri, 27 Sep 2024 15:29:05 -0500 Subject: [PATCH] September 2024 release (240927) (#44) --- charts/deepgram-self-hosted/CHANGELOG.md | 8 +++++++- charts/deepgram-self-hosted/Chart.yaml | 4 ++-- charts/deepgram-self-hosted/README.md | 8 ++++---- charts/deepgram-self-hosted/values.yaml | 6 +++--- docker/docker-compose.license-proxy.yml | 6 +++--- docker/docker-compose.standard.yml | 4 ++-- podman/podman-compose.license-proxy.yml | 6 +++--- podman/podman-compose.standard.yml | 4 ++-- 8 files changed, 26 insertions(+), 20 deletions(-) diff --git a/charts/deepgram-self-hosted/CHANGELOG.md b/charts/deepgram-self-hosted/CHANGELOG.md index a3d491b..d189dd8 100644 --- a/charts/deepgram-self-hosted/CHANGELOG.md +++ b/charts/deepgram-self-hosted/CHANGELOG.md @@ -6,8 +6,13 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/), ## [Unreleased] +## [0.6.0] - 2024-09-27 + ### Added +- Updated default container tags to September 2024 release. Refer to the [main Deepgram changelog](https://deepgram.com/changelog/deepgram-self-hosted-september-2024-release-240927) for additional details. Highlights include: + - Adds broader support in Engine container for model auto-loading during runtime. + - Filesystems that don't support `inotify`, such as `nfs`/`csi` PersistentVolumes in Kubernetes, can now load and unload models during runtime without requiring a Pod restart. - Automatic model management on AWS now supports model removal. See the `engine.modelManager.models.remove` section in the `values.yaml` file for details. - Container orchestrator environment variable added to improve support. @@ -115,7 +120,8 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/), - Initial implementation of the Helm chart. -[unreleased]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.5.0...HEAD +[unreleased]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.6.0...HEAD +[0.6.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.5.0...deepgram-self-hosted-0.6.0 [0.5.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.4.0...deepgram-self-hosted-0.5.0 [0.4.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.3.0...deepgram-self-hosted-0.4.0 [0.3.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.2.3...deepgram-self-hosted-0.3.0 diff --git a/charts/deepgram-self-hosted/Chart.yaml b/charts/deepgram-self-hosted/Chart.yaml index b38f03f..e14218f 100644 --- a/charts/deepgram-self-hosted/Chart.yaml +++ b/charts/deepgram-self-hosted/Chart.yaml @@ -1,8 +1,8 @@ apiVersion: v2 name: deepgram-self-hosted type: application -version: 0.5.0 -appVersion: "release-240827" +version: 0.6.0 +appVersion: "release-240927" description: A Helm chart for running Deepgram services in a self-hosted environment home: "https://developers.deepgram.com/docs/self-hosted-introduction" sources: ["https://github.com/deepgram/self-hosted-resources"] diff --git a/charts/deepgram-self-hosted/README.md b/charts/deepgram-self-hosted/README.md index 5c88b2f..d04c681 100644 --- a/charts/deepgram-self-hosted/README.md +++ b/charts/deepgram-self-hosted/README.md @@ -1,6 +1,6 @@ # deepgram-self-hosted -![Version: 0.5.0](https://img.shields.io/badge/Version-0.5.0-informational?style=flat-square) ![Type: application](https://img.shields.io/badge/Type-application-informational?style=flat-square) ![AppVersion: release-240827](https://img.shields.io/badge/AppVersion-release--240827-informational?style=flat-square) [![Artifact Hub](https://img.shields.io/endpoint?url=https://artifacthub.io/badge/repository/deepgram-self-hosted)](https://artifacthub.io/packages/search?repo=deepgram-self-hosted) +![Version: 0.6.0](https://img.shields.io/badge/Version-0.6.0-informational?style=flat-square) ![Type: application](https://img.shields.io/badge/Type-application-informational?style=flat-square) ![AppVersion: release-240927](https://img.shields.io/badge/AppVersion-release--240927-informational?style=flat-square) [![Artifact Hub](https://img.shields.io/endpoint?url=https://artifacthub.io/badge/repository/deepgram-self-hosted)](https://artifacthub.io/packages/search?repo=deepgram-self-hosted) A Helm chart for running Deepgram services in a self-hosted environment @@ -192,7 +192,7 @@ If you encounter issues while deploying or using Deepgram, consider the followin | api.features.entityRedaction | bool | `false` | Enables entity-based redaction on pre-recorded audio *if* a valid entity detection model is available. *WARNING*: Beta functionality. | | api.image.path | string | `"quay.io/deepgram/self-hosted-api"` | path configures the image path to use for creating API containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | | api.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram API image | -| api.image.tag | string | `"release-240827"` | tag defines which Deepgram release to use for API containers | +| api.image.tag | string | `"release-240927"` | tag defines which Deepgram release to use for API containers | | api.livenessProbe | object | `` | Liveness probe customization for API pods. | | api.namePrefix | string | `"deepgram-api"` | namePrefix is the prefix to apply to the name of all K8s objects associated with the Deepgram API containers. | | api.readinessProbe | object | `` | Readiness probe customization for API pods. | @@ -231,7 +231,7 @@ If you encounter issues while deploying or using Deepgram, consider the followin | engine.halfPrecision.state | string | `"auto"` | Engine will automatically enable half precision operations if your GPU supports them. You can explicitly enable or disable this behavior with the state parameter which supports `"enable"`, `"disabled"`, and `"auto"`. | | engine.image.path | string | `"quay.io/deepgram/self-hosted-engine"` | path configures the image path to use for creating Engine containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | | engine.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram Engine image | -| engine.image.tag | string | `"release-240827"` | tag defines which Deepgram release to use for Engine containers | +| engine.image.tag | string | `"release-240927"` | tag defines which Deepgram release to use for Engine containers | | engine.livenessProbe | object | `` | Liveness probe customization for Engine pods. | | engine.metricsServer | object | `` | metricsServer exposes an endpoint on each Engine container for reporting inference-specific system metrics. See https://developers.deepgram.com/docs/metrics-guide#deepgram-engine for more details. | | engine.metricsServer.host | string | `"0.0.0.0"` | host is the IP address to listen on for metrics requests. You will want to listen on all interfaces to interact with other pods in the cluster. | @@ -289,7 +289,7 @@ If you encounter issues while deploying or using Deepgram, consider the followin | licenseProxy.enabled | bool | `false` | The License Proxy is optional, but highly recommended to be deployed in production to enable highly available environments. | | licenseProxy.image.path | string | `"quay.io/deepgram/self-hosted-license-proxy"` | path configures the image path to use for creating License Proxy containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | | licenseProxy.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram License Proxy image | -| licenseProxy.image.tag | string | `"release-240827"` | tag defines which Deepgram release to use for License Proxy containers | +| licenseProxy.image.tag | string | `"release-240927"` | tag defines which Deepgram release to use for License Proxy containers | | licenseProxy.keepUpstreamServerAsBackup | bool | `true` | Even with a License Proxy deployed, API and Engine pods can be configured to keep the upstream `license.deepgram.com` license server as a fallback licensing option if the License Proxy is unavailable. Disable this option if you are restricting API/Engine Pod network access for security reasons, and only the License Proxy should send egress traffic to the upstream license server. | | licenseProxy.livenessProbe | object | `` | Liveness probe customization for Proxy pods. | | licenseProxy.namePrefix | string | `"deepgram-license-proxy"` | namePrefix is the prefix to apply to the name of all K8s objects associated with the Deepgram License Proxy containers. | diff --git a/charts/deepgram-self-hosted/values.yaml b/charts/deepgram-self-hosted/values.yaml index 99418cd..029591d 100644 --- a/charts/deepgram-self-hosted/values.yaml +++ b/charts/deepgram-self-hosted/values.yaml @@ -112,7 +112,7 @@ api: # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram API image pullPolicy: IfNotPresent # -- tag defines which Deepgram release to use for API containers - tag: release-240827 + tag: release-240927 # -- Additional labels to add to API resources additionalLabels: {} @@ -278,7 +278,7 @@ engine: # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram Engine image pullPolicy: IfNotPresent # -- tag defines which Deepgram release to use for Engine containers - tag: release-240827 + tag: release-240927 # -- Additional labels to add to Engine resources additionalLabels: {} @@ -529,7 +529,7 @@ licenseProxy: # Deepgram images into a private container registry. path: quay.io/deepgram/self-hosted-license-proxy # -- tag defines which Deepgram release to use for License Proxy containers - tag: release-240827 + tag: release-240927 # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram # License Proxy image pullPolicy: IfNotPresent diff --git a/docker/docker-compose.license-proxy.yml b/docker/docker-compose.license-proxy.yml index 373e37c..883541b 100644 --- a/docker/docker-compose.license-proxy.yml +++ b/docker/docker-compose.license-proxy.yml @@ -9,7 +9,7 @@ x-env: &env services: # The speech API service. api: - image: quay.io/deepgram/self-hosted-api:release-240827 + image: quay.io/deepgram/self-hosted-api:release-240927 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -43,7 +43,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/self-hosted-engine:release-240827 + image: quay.io/deepgram/self-hosted-engine:release-240927 # Utilize a GPU, if available. runtime: nvidia @@ -83,7 +83,7 @@ services: # The service to validate your Deepgram license license-proxy: - image: quay.io/deepgram/self-hosted-license-proxy:release-240827 + image: quay.io/deepgram/self-hosted-license-proxy:release-240927 # Here we expose the License Proxy status port to the host machine. The container port # (right-hand side) must match the port that the License Proxy service is listening diff --git a/docker/docker-compose.standard.yml b/docker/docker-compose.standard.yml index 9ab795b..59611a3 100644 --- a/docker/docker-compose.standard.yml +++ b/docker/docker-compose.standard.yml @@ -9,7 +9,7 @@ x-env: &env services: # The speech API service. api: - image: quay.io/deepgram/self-hosted-api:release-240827 + image: quay.io/deepgram/self-hosted-api:release-240927 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -39,7 +39,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/self-hosted-engine:release-240827 + image: quay.io/deepgram/self-hosted-engine:release-240927 # Utilize a GPU, if available. runtime: nvidia diff --git a/podman/podman-compose.license-proxy.yml b/podman/podman-compose.license-proxy.yml index 5418083..9b1aa40 100644 --- a/podman/podman-compose.license-proxy.yml +++ b/podman/podman-compose.license-proxy.yml @@ -3,7 +3,7 @@ services: # The speech API service. api: - image: quay.io/deepgram/self-hosted-api:release-240827 + image: quay.io/deepgram/self-hosted-api:release-240927 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -40,7 +40,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/self-hosted-engine:release-240827 + image: quay.io/deepgram/self-hosted-engine:release-240927 # Utilize a GPU, if available. devices: @@ -84,7 +84,7 @@ services: # The service to validate your Deepgram license license-proxy: - image: quay.io/deepgram/self-hosted-license-proxy:release-240827 + image: quay.io/deepgram/self-hosted-license-proxy:release-240927 # Here we expose the License Proxy status port to the host machine. The container port # (right-hand side) must match the port that the License Proxy service is listening diff --git a/podman/podman-compose.standard.yml b/podman/podman-compose.standard.yml index 878bcfa..8df4546 100644 --- a/podman/podman-compose.standard.yml +++ b/podman/podman-compose.standard.yml @@ -3,7 +3,7 @@ services: # The speech API service. api: - image: quay.io/deepgram/self-hosted-api:release-240827 + image: quay.io/deepgram/self-hosted-api:release-240927 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -36,7 +36,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/self-hosted-engine:release-240827 + image: quay.io/deepgram/self-hosted-engine:release-240927 # Utilize a GPU, if available. devices: