From 30ed8bf55a03adb21a3518dff8c4be546b6445f1 Mon Sep 17 00:00:00 2001
From: Dev Aggarwal
Date: Thu, 5 Sep 2024 20:48:26 +0530
Subject: [PATCH] Add deployment configuration for Sea Lion v2.1 model in model-values.yaml

---
Reviewer notes (this commentary area is ignored by `git am`):

  * Adds a `common-llms-sealion-v2-1` entry to the `deployments` list,
    directly after the existing entry whose LLM_MODEL_IDS is
    aisingapore/llama3-8b-cpt-sea-lionv2-instruct. The new entry reuses
    the gooey-gpu-common:7 image and the `common.llms` import, and sets
    LLM_MODEL_IDS to aisingapore/llama3-8b-cpt-sea-lionv2.1-instruct.
  * NOTE(review): the inline formula `(220 / 80) * 30` evaluates to 82.5,
    while the memory limit is "80Gi" - confirm the rounding down is
    intentional.
  * NOTE(review): leading whitespace inside the hunk was reconstructed
    assuming 2-space YAML nesting under `deployments:` - confirm against
    chart/model-values.yaml before applying.

 chart/model-values.yaml | 11 +++++++++++
 1 file changed, 11 insertions(+)

diff --git a/chart/model-values.yaml b/chart/model-values.yaml
index a32ad6b..07c6423 100644
--- a/chart/model-values.yaml
+++ b/chart/model-values.yaml
@@ -354,6 +354,17 @@ deployments:
       LLM_MODEL_IDS: |-
         aisingapore/llama3-8b-cpt-sea-lionv2-instruct
 
+  - name: "common-llms-sealion-v2-1"
+    image: "crgooeyprodwestus1.azurecr.io/gooey-gpu-common:7"
+    limits_gpu: "30Gi"
+    limits:
+      memory: "80Gi"  # (220 / 80) * 30
+    env:
+      IMPORTS: |-
+        common.llms
+      LLM_MODEL_IDS: |-
+        aisingapore/llama3-8b-cpt-sea-lionv2.1-instruct
+
   - name: "common-llms-sarvam-2b"
     image: "crgooeyprodwestus1.azurecr.io/gooey-gpu-common:7"
     limits_gpu: "6Gi"