From 91987dcfa80e18fc8d93f792e89b0793862b74f3 Mon Sep 17 00:00:00 2001 From: Julia Kroll <135150417+jkroll-deepgram@users.noreply.github.com> Date: Tue, 27 Aug 2024 15:20:56 -0500 Subject: [PATCH] release-240827, including onprem to self-hosted rename (#40) --- charts/deepgram-self-hosted/CHANGELOG.md | 15 ++++++++++++++- charts/deepgram-self-hosted/Chart.yaml | 4 ++-- charts/deepgram-self-hosted/README.md | 20 ++++++++++---------- charts/deepgram-self-hosted/README.md.gotmpl | 2 +- charts/deepgram-self-hosted/values.yaml | 16 ++++++++-------- docker/README.md | 2 +- docker/docker-compose.license-proxy.yml | 18 +++++++++--------- docker/docker-compose.standard.yml | 12 ++++++------ podman/README.md | 2 +- podman/podman-compose.license-proxy.yml | 18 +++++++++--------- podman/podman-compose.standard.yml | 12 ++++++------ 11 files changed, 67 insertions(+), 54 deletions(-) diff --git a/charts/deepgram-self-hosted/CHANGELOG.md b/charts/deepgram-self-hosted/CHANGELOG.md index cc63a92..280984c 100644 --- a/charts/deepgram-self-hosted/CHANGELOG.md +++ b/charts/deepgram-self-hosted/CHANGELOG.md @@ -6,10 +6,22 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/), ## [Unreleased] +## [0.5.0] - 2024-08-27 + +### Added + +- Updated default container tags to August 2024 release. Refer to the [main Deepgram changelog](https://deepgram.com/changelog/deepgram-self-hosted-august-2024-release-240827) for additional details. Highlights include: + - GA support for entity detection for pre-recorded English audio + - GA support for improved redaction for pre-recorded English audio + ### Fixed - Fixed a misleading comment in the `03-basic-setup-onprem.yaml` sample file that wrongly suggested `engine.modelManager.volumes.customVolumeClaim.name` should be a `PersistentVolume` instead of a `PersistentVolumeClaim` +### Changed + +- Deepgram's core products are available to host both on-premises and in the cloud. Official resources have been updated to refer to a ["self-hosted" product offering](https://deepgram.com/self-hosted), instead of an "onprem" product offering, to align the product name with industry naming standards. The Deepgram Quay image repository names have been updated to reflect this. + ## [0.4.0] - 2024-07-25 ### Added @@ -88,7 +100,8 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/), - Initial implementation of the Helm chart. -[unreleased]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.4.0...HEAD +[unreleased]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.5.0...HEAD +[0.5.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.4.0...deepgram-self-hosted-0.5.0 [0.4.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.3.0...deepgram-self-hosted-0.4.0 [0.3.0]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.2.3...deepgram-self-hosted-0.3.0 [0.2.3]: https://github.com/deepgram/self-hosted-resources/compare/deepgram-self-hosted-0.2.2-beta...deepgram-self-hosted-0.2.3 diff --git a/charts/deepgram-self-hosted/Chart.yaml b/charts/deepgram-self-hosted/Chart.yaml index 697e516..b38f03f 100644 --- a/charts/deepgram-self-hosted/Chart.yaml +++ b/charts/deepgram-self-hosted/Chart.yaml @@ -1,8 +1,8 @@ apiVersion: v2 name: deepgram-self-hosted type: application -version: 0.4.0 -appVersion: "release-240725" +version: 0.5.0 +appVersion: "release-240827" description: A Helm chart for running Deepgram services in a self-hosted environment home: "https://developers.deepgram.com/docs/self-hosted-introduction" sources: ["https://github.com/deepgram/self-hosted-resources"] diff --git a/charts/deepgram-self-hosted/README.md b/charts/deepgram-self-hosted/README.md index c611e03..d164adc 100644 --- a/charts/deepgram-self-hosted/README.md +++ b/charts/deepgram-self-hosted/README.md @@ -1,6 +1,6 @@ # deepgram-self-hosted -![Version: 0.4.0](https://img.shields.io/badge/Version-0.4.0-informational?style=flat-square) ![Type: application](https://img.shields.io/badge/Type-application-informational?style=flat-square) ![AppVersion: release-240725](https://img.shields.io/badge/AppVersion-release--240725-informational?style=flat-square) [![Artifact Hub](https://img.shields.io/endpoint?url=https://artifacthub.io/badge/repository/deepgram-self-hosted)](https://artifacthub.io/packages/search?repo=deepgram-self-hosted) +![Version: 0.5.0](https://img.shields.io/badge/Version-0.5.0-informational?style=flat-square) ![Type: application](https://img.shields.io/badge/Type-application-informational?style=flat-square) ![AppVersion: release-240827](https://img.shields.io/badge/AppVersion-release--240827-informational?style=flat-square) [![Artifact Hub](https://img.shields.io/endpoint?url=https://artifacthub.io/badge/repository/deepgram-self-hosted)](https://artifacthub.io/packages/search?repo=deepgram-self-hosted) A Helm chart for running Deepgram services in a self-hosted environment @@ -36,7 +36,7 @@ helm repo update The Deepgram self-hosted chart requires Helm 3.7+ in order to install successfully. Please check your helm release before installation. -You will need to provide your [self-service Deepgram licensing and credentials](https://developers.deepgram.com/docs/on-prem-self-service-tutorial) information. See `global.deepgramSecretRef` and `global.pullSecretRef` in the [Values section](#values) for more details, and the [Deepgram Self-Hosted Kubernetes Guides](https://developers.deepgram.com/docs/kubernetes) for instructions on how to create these secrets. +You will need to provide your [self-service Deepgram licensing and credentials](https://developers.deepgram.com/docs/self-hosted-self-service-tutorial) information. See `global.deepgramSecretRef` and `global.pullSecretRef` in the [Values section](#values) for more details, and the [Deepgram Self-Hosted Kubernetes Guides](https://developers.deepgram.com/docs/kubernetes) for instructions on how to create these secrets. You may also override any default configuration values. See [the Values section](#values) for a list of available options, and the [samples directory](./samples) for examples of a standard installation. @@ -190,16 +190,16 @@ If you encounter issues while deploying or using Deepgram, consider the followin | api.features.diskBufferPath | string | `nil` | If API is receiving requests faster than Engine can process them, a request queue will form. By default, this queue is stored in memory. Under high load, the queue may grow too large and cause Out-Of-Memory errors. To avoid this, set a diskBufferPath to buffer the overflow on the request queue to disk. WARN: This is only to temporarily buffer requests during high load. If there is not enough Engine capacity to process the queued requests over time, the queue (and response time) will grow indefinitely. | | api.features.entityDetection | bool | `false` | Enables entity detection on pre-recorded audio *if* a valid entity detection model is available. *WARNING*: Beta functionality. | | api.features.entityRedaction | bool | `false` | Enables entity-based redaction on pre-recorded audio *if* a valid entity detection model is available. *WARNING*: Beta functionality. | -| api.image.path | string | `"quay.io/deepgram/onprem-api"` | path configures the image path to use for creating API containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | +| api.image.path | string | `"quay.io/deepgram/self-hosted-api"` | path configures the image path to use for creating API containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | | api.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram API image | -| api.image.tag | string | `"release-240725"` | tag defines which Deepgram release to use for API containers | +| api.image.tag | string | `"release-240827"` | tag defines which Deepgram release to use for API containers | | api.livenessProbe | object | `` | Liveness probe customization for API pods. | | api.namePrefix | string | `"deepgram-api"` | namePrefix is the prefix to apply to the name of all K8s objects associated with the Deepgram API containers. | | api.readinessProbe | object | `` | Readiness probe customization for API pods. | | api.resolver | object | `` | Specify custom DNS resolution options. | | api.resolver.maxTTL | int | `nil` | maxTTL sets the DNS TTL value if specifying a custom DNS nameserver. | | api.resolver.nameservers | list | `[]` | nameservers allows for specifying custom domain name server(s). A valid list item's format is "{IP} {PORT} {PROTOCOL (tcp or udp)}", e.g. `"127.0.0.1 53 udp"`. | -| api.resources | object | `` | Configure resource limits per API container. See [Deepgram's documentation](https://developers.deepgram.com/docs/on-prem-deployment-environments#api) for more details. | +| api.resources | object | `` | Configure resource limits per API container. See [Deepgram's documentation](https://developers.deepgram.com/docs/self-hosted-deployment-environments#api) for more details. | | api.securityContext | object | `{}` | [Security context](https://kubernetes.io/docs/tasks/configure-pod-container/security-context/) for API pods. | | api.server | object | `` | Configure how the API will listen for your requests | | api.server.callbackConnTimeout | string | `"1s"` | callbackConnTimeout configures how long to wait for a connection to a callback URL. See [Deepgram's callback documentation](https://developers.deepgram.com/docs/callback) for more details. The value should be a humantime duration. | @@ -229,9 +229,9 @@ If you encounter issues while deploying or using Deepgram, consider the followin | engine.chunking.speechToText.streaming.step | float | `1` | step defines how often to return interim results, in seconds. This value may be lowered to increase the frequency of interim results. However, this also causes a significant decrease in the number of concurrent streams supported by a single GPU. Please contact your Deepgram Account representative for more details. | | engine.concurrencyLimit.activeRequests | int | `nil` | activeRequests limits the number of active requests handled by a single Engine container. If additional requests beyond the limit are sent, the API container forming the request will try a different Engine pod. If no Engine pods are able to accept the request, the API will return a 429 HTTP response to the client. The `nil` default means no limit will be set. | | engine.halfPrecision.state | string | `"auto"` | Engine will automatically enable half precision operations if your GPU supports them. You can explicitly enable or disable this behavior with the state parameter which supports `"enable"`, `"disabled"`, and `"auto"`. | -| engine.image.path | string | `"quay.io/deepgram/onprem-engine"` | path configures the image path to use for creating Engine containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | +| engine.image.path | string | `"quay.io/deepgram/self-hosted-engine"` | path configures the image path to use for creating Engine containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | | engine.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram Engine image | -| engine.image.tag | string | `"release-240725"` | tag defines which Deepgram release to use for Engine containers | +| engine.image.tag | string | `"release-240827"` | tag defines which Deepgram release to use for Engine containers | | engine.livenessProbe | object | `` | Liveness probe customization for Engine pods. | | engine.metricsServer | object | `` | metricsServer exposes an endpoint on each Engine container for reporting inference-specific system metrics. See https://developers.deepgram.com/docs/metrics-guide#deepgram-engine for more details. | | engine.metricsServer.host | string | `"0.0.0.0"` | host is the IP address to listen on for metrics requests. You will want to listen on all interfaces to interact with other pods in the cluster. | @@ -252,7 +252,7 @@ If you encounter issues while deploying or using Deepgram, consider the followin | engine.modelManager.volumes.gcp.gpd.volumeHandle | string | `""` | The identifier of your pre-existing persistent disk. The format is projects/{project_id}/zones/{zone_name}/disks/{disk_name} for Zonal persistent disks, or projects/{project_id}/regions/{region_name}/disks/{disk_name} for Regional persistent disks. | | engine.namePrefix | string | `"deepgram-engine"` | namePrefix is the prefix to apply to the name of all K8s objects associated with the Deepgram Engine containers. | | engine.readinessProbe | object | `` | Readiness probe customization for Engine pods. | -| engine.resources | object | `` | Configure resource limits per Engine container. See [Deepgram's documentation](https://developers.deepgram.com/docs/on-prem-deployment-environments#engine) for more details. | +| engine.resources | object | `` | Configure resource limits per Engine container. See [Deepgram's documentation](https://developers.deepgram.com/docs/self-hosted-deployment-environments#engine) for more details. | | engine.resources.limits.gpu | int | `1` | gpu maps to the nvidia.com/gpu resource parameter | | engine.resources.requests.gpu | int | `1` | gpu maps to the nvidia.com/gpu resource parameter | | engine.securityContext | object | `{}` | [Security context](https://kubernetes.io/docs/tasks/configure-pod-container/security-context/) for API pods. | @@ -285,9 +285,9 @@ If you encounter issues while deploying or using Deepgram, consider the followin | licenseProxy.affinity | object | `{}` | [Affinity and anti-affinity](https://kubernetes.io/docs/concepts/scheduling-eviction/assign-pod-node/#affinity-and-anti-affinity) to apply for License Proxy pods. | | licenseProxy.deploySecondReplica | bool | `false` | If the License Proxy is deployed, one replica should be sufficient to support many API/Engine pods. Highly available environments may wish to deploy a second replica to ensure uptime, which can be toggled with this option. | | licenseProxy.enabled | bool | `false` | The License Proxy is optional, but highly recommended to be deployed in production to enable highly available environments. | -| licenseProxy.image.path | string | `"quay.io/deepgram/onprem-license-proxy"` | path configures the image path to use for creating License Proxy containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | +| licenseProxy.image.path | string | `"quay.io/deepgram/self-hosted-license-proxy"` | path configures the image path to use for creating License Proxy containers. You may change this from the public Quay image path if you have imported Deepgram images into a private container registry. | | licenseProxy.image.pullPolicy | string | `"IfNotPresent"` | pullPolicy configures how the Kubelet attempts to pull the Deepgram License Proxy image | -| licenseProxy.image.tag | string | `"release-240725"` | tag defines which Deepgram release to use for License Proxy containers | +| licenseProxy.image.tag | string | `"release-240827"` | tag defines which Deepgram release to use for License Proxy containers | | licenseProxy.keepUpstreamServerAsBackup | bool | `true` | Even with a License Proxy deployed, API and Engine pods can be configured to keep the upstream `license.deepgram.com` license server as a fallback licensing option if the License Proxy is unavailable. Disable this option if you are restricting API/Engine Pod network access for security reasons, and only the License Proxy should send egress traffic to the upstream license server. | | licenseProxy.livenessProbe | object | `` | Liveness probe customization for Proxy pods. | | licenseProxy.namePrefix | string | `"deepgram-license-proxy"` | namePrefix is the prefix to apply to the name of all K8s objects associated with the Deepgram License Proxy containers. | diff --git a/charts/deepgram-self-hosted/README.md.gotmpl b/charts/deepgram-self-hosted/README.md.gotmpl index a273711..afc6dfe 100644 --- a/charts/deepgram-self-hosted/README.md.gotmpl +++ b/charts/deepgram-self-hosted/README.md.gotmpl @@ -26,7 +26,7 @@ helm repo update The Deepgram self-hosted chart requires Helm 3.7+ in order to install successfully. Please check your helm release before installation. -You will need to provide your [self-service Deepgram licensing and credentials](https://developers.deepgram.com/docs/on-prem-self-service-tutorial) information. See `global.deepgramSecretRef` and `global.pullSecretRef` in the [Values section](#values) for more details, and the [Deepgram Self-Hosted Kubernetes Guides](https://developers.deepgram.com/docs/kubernetes) for instructions on how to create these secrets. +You will need to provide your [self-service Deepgram licensing and credentials](https://developers.deepgram.com/docs/self-hosted-self-service-tutorial) information. See `global.deepgramSecretRef` and `global.pullSecretRef` in the [Values section](#values) for more details, and the [Deepgram Self-Hosted Kubernetes Guides](https://developers.deepgram.com/docs/kubernetes) for instructions on how to create these secrets. You may also override any default configuration values. See [the Values section](#values) for a list of available options, and the [samples directory](./samples) for examples of a standard installation. diff --git a/charts/deepgram-self-hosted/values.yaml b/charts/deepgram-self-hosted/values.yaml index 1cad41f..839ce14 100644 --- a/charts/deepgram-self-hosted/values.yaml +++ b/charts/deepgram-self-hosted/values.yaml @@ -108,11 +108,11 @@ api: # -- path configures the image path to use for creating API containers. # You may change this from the public Quay image path if you have imported # Deepgram images into a private container registry. - path: quay.io/deepgram/onprem-api + path: quay.io/deepgram/self-hosted-api # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram API image pullPolicy: IfNotPresent # -- tag defines which Deepgram release to use for API containers - tag: release-240725 + tag: release-240827 # -- Additional labels to add to API resources additionalLabels: {} @@ -134,7 +134,7 @@ api: maxSurge: 1 # -- Configure resource limits per API container. See - # [Deepgram's documentation](https://developers.deepgram.com/docs/on-prem-deployment-environments#api) + # [Deepgram's documentation](https://developers.deepgram.com/docs/self-hosted-deployment-environments#api) # for more details. # @default -- `` resources: @@ -274,11 +274,11 @@ engine: # -- path configures the image path to use for creating Engine containers. # You may change this from the public Quay image path if you have imported # Deepgram images into a private container registry. - path: quay.io/deepgram/onprem-engine + path: quay.io/deepgram/self-hosted-engine # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram Engine image pullPolicy: IfNotPresent # -- tag defines which Deepgram release to use for Engine containers - tag: release-240725 + tag: release-240827 # -- Additional labels to add to Engine resources additionalLabels: {} @@ -300,7 +300,7 @@ engine: maxSurge: 1 # -- Configure resource limits per Engine container. See - # [Deepgram's documentation](https://developers.deepgram.com/docs/on-prem-deployment-environments#engine) + # [Deepgram's documentation](https://developers.deepgram.com/docs/self-hosted-deployment-environments#engine) # for more details. # @default -- `` resources: @@ -518,9 +518,9 @@ licenseProxy: # -- path configures the image path to use for creating License Proxy containers. # You may change this from the public Quay image path if you have imported # Deepgram images into a private container registry. - path: quay.io/deepgram/onprem-license-proxy + path: quay.io/deepgram/self-hosted-license-proxy # -- tag defines which Deepgram release to use for License Proxy containers - tag: release-240725 + tag: release-240827 # -- pullPolicy configures how the Kubelet attempts to pull the Deepgram # License Proxy image pullPolicy: IfNotPresent diff --git a/docker/README.md b/docker/README.md index 40a6431..1f14c90 100644 --- a/docker/README.md +++ b/docker/README.md @@ -17,7 +17,7 @@ There are several [Docker Compose](https://docs.docker.com/compose/) templates f * `/path/to/engine.toml` * `/path/to/models` * `/path/to/license-proxy.toml`, if applicable -4. Export your [Deepgram self-hosted API key](https://developers.deepgram.com/docs/on-prem-self-service-tutorial#create-an-on-prem-api-key) in your deployment environment. +4. Export your [Deepgram self-hosted API key](https://developers.deepgram.com/docs/self-hosted-self-service-tutorial#create-a-self-hosted-api-key) in your deployment environment. ```bash $ export DEEPGRAM_API_KEY= ``` diff --git a/docker/docker-compose.license-proxy.yml b/docker/docker-compose.license-proxy.yml index 163a12c..b48191d 100644 --- a/docker/docker-compose.license-proxy.yml +++ b/docker/docker-compose.license-proxy.yml @@ -3,7 +3,7 @@ services: # The speech API service. api: - image: quay.io/deepgram/onprem-api:release-240725 + image: quay.io/deepgram/self-hosted-api:release-240827 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -11,7 +11,7 @@ services: ports: - "8080:8080" - # Make sure you `export` your on-prem API key secret in your local environment + # Make sure you `export` your self-hosted API key secret in your local environment environment: DEEPGRAM_API_KEY: "${DEEPGRAM_API_KEY}" @@ -26,7 +26,7 @@ services: # Default resource limits. Increase as needed. # For more details, see: - # https://developers.deepgram.com/docs/on-prem-deployment-environments#hardware-specifications + # https://developers.deepgram.com/docs/self-hosted-deployment-environments#hardware-specifications deploy: resources: limits: @@ -39,7 +39,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/onprem-engine:release-240725 + image: quay.io/deepgram/self-hosted-engine:release-240827 # Utilize a GPU, if available. runtime: nvidia @@ -47,7 +47,7 @@ services: ports: - "9991:9991" - # Make sure you `export` your on-prem API key secret in your local environment + # Make sure you `export` your self-hosted API key secret in your local environment environment: DEEPGRAM_API_KEY: "${DEEPGRAM_API_KEY}" @@ -64,7 +64,7 @@ services: # Default resource limits. Increase as needed. # For more details, see: - # https://developers.deepgram.com/docs/on-prem-deployment-environments#hardware-specifications + # https://developers.deepgram.com/docs/self-hosted-deployment-environments#hardware-specifications deploy: resources: limits: @@ -81,7 +81,7 @@ services: # The service to validate your Deepgram license license-proxy: - image: quay.io/deepgram/onprem-license-proxy:release-240725 + image: quay.io/deepgram/self-hosted-license-proxy:release-240827 # Here we expose the License Proxy status port to the host machine. The container port # (right-hand side) must match the port that the License Proxy service is listening @@ -89,7 +89,7 @@ services: ports: - "8089:8080" - # Make sure you `export` your on-prem API key secret in your local environment + # Make sure you `export` your self-hosted API key secret in your local environment environment: DEEPGRAM_API_KEY: "${DEEPGRAM_API_KEY}" @@ -104,7 +104,7 @@ services: # Default resource limits. Increase as needed. # For more details, see: - # https://developers.deepgram.com/docs/on-prem-deployment-environments#hardware-specifications + # https://developers.deepgram.com/docs/self-hosted-deployment-environments#hardware-specifications deploy: resources: limits: diff --git a/docker/docker-compose.standard.yml b/docker/docker-compose.standard.yml index b6a1bf8..3d4c16a 100644 --- a/docker/docker-compose.standard.yml +++ b/docker/docker-compose.standard.yml @@ -3,7 +3,7 @@ services: # The speech API service. api: - image: quay.io/deepgram/onprem-api:release-240725 + image: quay.io/deepgram/self-hosted-api:release-240827 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -11,7 +11,7 @@ services: ports: - "8080:8080" - # Make sure you `export` your on-prem API key secret in your local environment + # Make sure you `export` your self-hosted API key secret in your local environment environment: DEEPGRAM_API_KEY: "${DEEPGRAM_API_KEY}" @@ -26,7 +26,7 @@ services: # Default resource limits. Increase as needed. # For more details, see: - # https://developers.deepgram.com/docs/on-prem-deployment-environments#hardware-specifications + # https://developers.deepgram.com/docs/self-hosted-deployment-environments#hardware-specifications deploy: resources: limits: @@ -35,7 +35,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/onprem-engine:release-240725 + image: quay.io/deepgram/self-hosted-engine:release-240827 # Utilize a GPU, if available. runtime: nvidia @@ -43,7 +43,7 @@ services: ports: - "9991:9991" - # Make sure you `export` your on-prem API key secret in your local environment + # Make sure you `export` your self-hosted API key secret in your local environment environment: DEEPGRAM_API_KEY: "${DEEPGRAM_API_KEY}" @@ -60,7 +60,7 @@ services: # Default resource limits. Increase as needed. # For more details, see: - # https://developers.deepgram.com/docs/on-prem-deployment-environments#hardware-specifications + # https://developers.deepgram.com/docs/self-hosted-deployment-environments#hardware-specifications deploy: resources: limits: diff --git a/podman/README.md b/podman/README.md index d88acc3..3765266 100644 --- a/podman/README.md +++ b/podman/README.md @@ -17,7 +17,7 @@ There are several [Podman Compose](https://github.com/containers/podman-compose) * `/path/to/engine.toml` * `/path/to/models` * `/path/to/license-proxy.toml`, if applicable -4. Export your [Deepgram self-hosted API key](https://developers.deepgram.com/docs/on-prem-self-service-tutorial#create-an-on-prem-api-key) in your deployment environment. +4. Export your [Deepgram self-hosted API key](https://developers.deepgram.com/docs/self-hosted-self-service-tutorial#create-a-self-hosted-api-key) in your deployment environment. ```bash $ export DEEPGRAM_API_KEY= ``` diff --git a/podman/podman-compose.license-proxy.yml b/podman/podman-compose.license-proxy.yml index ed3841a..5c7e7f8 100644 --- a/podman/podman-compose.license-proxy.yml +++ b/podman/podman-compose.license-proxy.yml @@ -3,7 +3,7 @@ services: # The speech API service. api: - image: quay.io/deepgram/onprem-api:release-240725 + image: quay.io/deepgram/self-hosted-api:release-240827 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -11,7 +11,7 @@ services: ports: - "8080:8080" - # Make sure you `export` your onprem API key secret in your local environment + # Make sure you `export` your self-hosted API key secret in your local environment environment: DEEPGRAM_API_KEY: "${DEEPGRAM_API_KEY}" @@ -26,7 +26,7 @@ services: # Default resource limits. Increase as needed. # For more details, see: - # https://developers.deepgram.com/docs/on-prem-deployment-environments#hardware-specifications + # https://developers.deepgram.com/docs/self-hosted-deployment-environments#hardware-specifications deploy: resources: limits: @@ -39,7 +39,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/onprem-engine:release-240725 + image: quay.io/deepgram/self-hosted-engine:release-240827 # Utilize a GPU, if available. devices: @@ -48,7 +48,7 @@ services: ports: - "9991:9991" - # Make sure you `export` your on-prem API key secret in your local environment + # Make sure you `export` your self-hosted API key secret in your local environment environment: DEEPGRAM_API_KEY: "${DEEPGRAM_API_KEY}" @@ -65,7 +65,7 @@ services: # Default resource limits. Increase as needed. # For more details, see: - # https://developers.deepgram.com/docs/on-prem-deployment-environments#hardware-specifications + # https://developers.deepgram.com/docs/self-hosted-deployment-environments#hardware-specifications deploy: resources: limits: @@ -82,7 +82,7 @@ services: # The service to validate your Deepgram license license-proxy: - image: quay.io/deepgram/onprem-license-proxy:release-240725 + image: quay.io/deepgram/self-hosted-license-proxy:release-240827 # Here we expose the License Proxy status port to the host machine. The container port # (right-hand side) must match the port that the License Proxy service is listening @@ -90,7 +90,7 @@ services: ports: - "8089:8080" - # Make sure you `export` your on-prem API key secret in your local environment + # Make sure you `export` your self-hosted API key secret in your local environment environment: DEEPGRAM_API_KEY: "${DEEPGRAM_API_KEY}" @@ -105,7 +105,7 @@ services: # Default resource limits. Increase as needed. # For more details, see: - # https://developers.deepgram.com/docs/on-prem-deployment-environments#hardware-specifications + # https://developers.deepgram.com/docs/self-hosted-deployment-environments#hardware-specifications deploy: resources: limits: diff --git a/podman/podman-compose.standard.yml b/podman/podman-compose.standard.yml index 522bb62..1bca3cb 100644 --- a/podman/podman-compose.standard.yml +++ b/podman/podman-compose.standard.yml @@ -3,7 +3,7 @@ services: # The speech API service. api: - image: quay.io/deepgram/onprem-api:release-240725 + image: quay.io/deepgram/self-hosted-api:release-240827 # Here we expose the API port to the host machine. The container port # (right-hand side) must match the port that the API service is listening @@ -11,7 +11,7 @@ services: ports: - "8080:8080" - # Make sure you `export` your on-prem API key secret in your local environment + # Make sure you `export` your self-hosted API key secret in your local environment environment: DEEPGRAM_API_KEY: "${DEEPGRAM_API_KEY}" @@ -26,7 +26,7 @@ services: # Default resource limits. Increase as needed. # For more details, see: - # https://developers.deepgram.com/docs/on-prem-deployment-environments#hardware-specifications + # https://developers.deepgram.com/docs/self-hosted-deployment-environments#hardware-specifications deploy: resources: limits: @@ -35,7 +35,7 @@ services: # The speech engine service. engine: - image: quay.io/deepgram/onprem-engine:release-240725 + image: quay.io/deepgram/self-hosted-engine:release-240827 # Utilize a GPU, if available. devices: @@ -44,7 +44,7 @@ services: ports: - "9991:9991" - # Make sure you `export` your on-prem API key secret in your local environment + # Make sure you `export` your self-hosted API key secret in your local environment environment: DEEPGRAM_API_KEY: "${DEEPGRAM_API_KEY}" @@ -61,7 +61,7 @@ services: # Default resource limits. Increase as needed. # For more details, see: - # https://developers.deepgram.com/docs/on-prem-deployment-environments#hardware-specifications + # https://developers.deepgram.com/docs/self-hosted-deployment-environments#hardware-specifications deploy: resources: limits: