From 23affa5542e3eab7943f2b3aaaf1907282bac413 Mon Sep 17 00:00:00 2001 From: Dolpher Du Date: Thu, 19 Dec 2024 07:35:06 +0000 Subject: [PATCH] Enable norerank and withwrapper config Signed-off-by: Dolpher Du --- helm-charts/chatqna/norerank-values.yaml | 11 +++++++++++ helm-charts/chatqna/templates/deployment.yaml | 12 ++++++++++++ helm-charts/chatqna/withwrapper-values.yaml | 15 +++++++++++++++ 3 files changed, 38 insertions(+) create mode 100644 helm-charts/chatqna/norerank-values.yaml create mode 100644 helm-charts/chatqna/withwrapper-values.yaml diff --git a/helm-charts/chatqna/norerank-values.yaml b/helm-charts/chatqna/norerank-values.yaml new file mode 100644 index 00000000..aa069c1c --- /dev/null +++ b/helm-charts/chatqna/norerank-values.yaml @@ -0,0 +1,11 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# Deploy ChatQnA without the reranking stage: use the rerank-free +# megaservice image and disable the teirerank subchart + +image: + repository: opea/chatqna-without-rerank + +teirerank: + enabled: false diff --git a/helm-charts/chatqna/templates/deployment.yaml b/helm-charts/chatqna/templates/deployment.yaml index 4a1a1e31..e64f84e9 100644 --- a/helm-charts/chatqna/templates/deployment.yaml +++ b/helm-charts/chatqna/templates/deployment.yaml @@ -64,6 +64,18 @@ spec: value: {{ .Release.Name }}-guardrails-usvc - name: GUARDRAIL_SERVICE_PORT value: "9090" + - name: LLM_SERVICE_HOST_IP + value: {{ .Release.Name }}-llm-uservice + - name: LLM_SERVICE_PORT + value: "9000" + - name: RERANK_SERVICE_HOST_IP + value: {{ .Release.Name }}-reranking-usvc + - name: RERANK_SERVICE_PORT + value: "8000" + - name: EMBEDDING_SERVICE_HOST_IP + value: {{ .Release.Name }}-embedding-usvc + - name: EMBEDDING_SERVICE_PORT + value: "6000" {{- if .Values.LOGFLAG }} - name: LOGFLAG value: {{ .Values.LOGFLAG | quote }} diff --git a/helm-charts/chatqna/withwrapper-values.yaml b/helm-charts/chatqna/withwrapper-values.yaml new file mode 100644 index 
00000000..0c0de471 --- /dev/null +++ b/helm-charts/chatqna/withwrapper-values.yaml @@ -0,0 +1,15 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# Deploy ChatQnA with the wrapper megaservice image and enable the +# llm-uservice, embedding-usvc and reranking-usvc subcharts + +image: + repository: opea/chatqna-wrapper + +llm-uservice: + enabled: true +embedding-usvc: + enabled: true +reranking-usvc: + enabled: true