From 6829a4978546082861eb74c9c8201864621c5e4c Mon Sep 17 00:00:00 2001
From: Dev Aggarwal
Date: Tue, 13 Aug 2024 01:04:43 +0530
Subject: [PATCH] fix: error when getting metric values no matching metrics
 found for s0-rabbitmq-gooey-gpu-2ffacebook-2fseamless-m4t-v2-large

---
Notes (this section is ignored by `git am`):

  * chart/model-values.yaml: for the "common-seamless" deployment the GPU
    limit moves out of the `limits` map into a sibling `limits_gpu` key.
  * chart/templates/deployment.yaml: when `.limits_gpu` is set, the
    container gets an explicit RESOURCE_LIMITS_GPU environment variable,
    emitted right after the existing RESOURCE_LIMITS_<NAME> entries.
  * NOTE(review): the column indentation of the hunk lines below was
    reconstructed from the key nesting -- confirm it against the target
    files (or apply with `git apply --ignore-whitespace`) before merging.

 chart/model-values.yaml         | 2 +-
 chart/templates/deployment.yaml | 4 ++++
 2 files changed, 5 insertions(+), 1 deletion(-)

diff --git a/chart/model-values.yaml b/chart/model-values.yaml
index 3a7e736..b331dcf 100644
--- a/chart/model-values.yaml
+++ b/chart/model-values.yaml
@@ -203,8 +203,8 @@ deployments:
 
   - name: "common-seamless"
     image: "crgooeyprodwestus1.azurecr.io/gooey-gpu-common:6"
+    limits_gpu: "10Gi"
     limits:
-      gpu: "10Gi"
       memory: "28Gi" # (220 / 80) * 10
       cpu: "1"
     env:
diff --git a/chart/templates/deployment.yaml b/chart/templates/deployment.yaml
index 38db280..323f151 100644
--- a/chart/templates/deployment.yaml
+++ b/chart/templates/deployment.yaml
@@ -50,6 +50,10 @@ spec:
             - name: "RESOURCE_LIMITS_{{ $name | upper }}"
               value: "{{ $value }}"
             {{- end }}
+            {{- if .limits_gpu }}
+            - name: "RESOURCE_LIMITS_GPU"
+              value: "{{ .limits_gpu }}"
+            {{- end }}
           livenessProbe:
             exec:
               command: [ "bash", "-c", "celery inspect ping -d celery@$HOSTNAME" ]