From 2f5fa2b91581e40a3480f633d2bfb5c55c6121df Mon Sep 17 00:00:00 2001 From: Zhenzhong1 <109137058+Zhenzhong1@users.noreply.github.com> Date: Thu, 19 Sep 2024 11:03:10 +0800 Subject: [PATCH] [ChatQnA] Update OOB with wrapper manifests. (#823) --- .../with_rerank/four_gaudi/oob_four_gaudi_with_rerank.yaml | 4 ---- .../single_gaudi/oob_single_gaudi_with_rerank.yaml | 4 ---- .../oob/with_rerank/two_gaudi/oob_two_gaudi_with_rerank.yaml | 4 ---- .../four_gaudi/oob_four_gaudi_without_rerank.yaml | 4 ---- .../single_gaudi/oob_single_gaudi_without_rerank.yaml | 4 ---- .../two_gaudi/oob_two_gaudi_without_rerank.yaml | 4 ---- 6 files changed, 24 deletions(-) diff --git a/ChatQnA/benchmark/oob/with_rerank/four_gaudi/oob_four_gaudi_with_rerank.yaml b/ChatQnA/benchmark/oob/with_rerank/four_gaudi/oob_four_gaudi_with_rerank.yaml index 85866573f1..c447bcec29 100644 --- a/ChatQnA/benchmark/oob/with_rerank/four_gaudi/oob_four_gaudi_with_rerank.yaml +++ b/ChatQnA/benchmark/oob/with_rerank/four_gaudi/oob_four_gaudi_with_rerank.yaml @@ -275,10 +275,6 @@ spec: - '2048' - --max-total-tokens - '4096' - - --max-batch-total-tokens - - '65536' - - --max-batch-prefill-tokens - - '4096' env: - name: OMPI_MCA_btl_vader_single_copy_mechanism value: none diff --git a/ChatQnA/benchmark/oob/with_rerank/single_gaudi/oob_single_gaudi_with_rerank.yaml b/ChatQnA/benchmark/oob/with_rerank/single_gaudi/oob_single_gaudi_with_rerank.yaml index eb63aada5f..859568ef97 100644 --- a/ChatQnA/benchmark/oob/with_rerank/single_gaudi/oob_single_gaudi_with_rerank.yaml +++ b/ChatQnA/benchmark/oob/with_rerank/single_gaudi/oob_single_gaudi_with_rerank.yaml @@ -275,10 +275,6 @@ spec: - '2048' - --max-total-tokens - '4096' - - --max-batch-total-tokens - - '65536' - - --max-batch-prefill-tokens - - '4096' env: - name: OMPI_MCA_btl_vader_single_copy_mechanism value: none diff --git a/ChatQnA/benchmark/oob/with_rerank/two_gaudi/oob_two_gaudi_with_rerank.yaml b/ChatQnA/benchmark/oob/with_rerank/two_gaudi/oob_two_gaudi_with_rerank.yaml index 1b9bf7ebfe..b64263be1c 100644 --- a/ChatQnA/benchmark/oob/with_rerank/two_gaudi/oob_two_gaudi_with_rerank.yaml +++ b/ChatQnA/benchmark/oob/with_rerank/two_gaudi/oob_two_gaudi_with_rerank.yaml @@ -275,10 +275,6 @@ spec: - '2048' - --max-total-tokens - '4096' - - --max-batch-total-tokens - - '65536' - - --max-batch-prefill-tokens - - '4096' env: - name: OMPI_MCA_btl_vader_single_copy_mechanism value: none diff --git a/ChatQnA/benchmark/oob/without_rerank/four_gaudi/oob_four_gaudi_without_rerank.yaml b/ChatQnA/benchmark/oob/without_rerank/four_gaudi/oob_four_gaudi_without_rerank.yaml index e010496b8f..6869a78f13 100644 --- a/ChatQnA/benchmark/oob/without_rerank/four_gaudi/oob_four_gaudi_without_rerank.yaml +++ b/ChatQnA/benchmark/oob/without_rerank/four_gaudi/oob_four_gaudi_without_rerank.yaml @@ -336,10 +336,6 @@ spec: - '2048' - --max-total-tokens - '4096' - - --max-batch-total-tokens - - '65536' - - --max-batch-prefill-tokens - - '4096' volumeMounts: - mountPath: /data name: model-volume diff --git a/ChatQnA/benchmark/oob/without_rerank/single_gaudi/oob_single_gaudi_without_rerank.yaml b/ChatQnA/benchmark/oob/without_rerank/single_gaudi/oob_single_gaudi_without_rerank.yaml index b75e8f291a..f38efbeb63 100644 --- a/ChatQnA/benchmark/oob/without_rerank/single_gaudi/oob_single_gaudi_without_rerank.yaml +++ b/ChatQnA/benchmark/oob/without_rerank/single_gaudi/oob_single_gaudi_without_rerank.yaml @@ -336,10 +336,6 @@ spec: - '2048' - --max-total-tokens - '4096' - - --max-batch-total-tokens - - '65536' - - --max-batch-prefill-tokens - - '4096' volumeMounts: - mountPath: /data name: model-volume diff --git a/ChatQnA/benchmark/oob/without_rerank/two_gaudi/oob_two_gaudi_without_rerank.yaml b/ChatQnA/benchmark/oob/without_rerank/two_gaudi/oob_two_gaudi_without_rerank.yaml index fa62ef84d7..a43553ddad 100644 --- a/ChatQnA/benchmark/oob/without_rerank/two_gaudi/oob_two_gaudi_without_rerank.yaml +++ b/ChatQnA/benchmark/oob/without_rerank/two_gaudi/oob_two_gaudi_without_rerank.yaml @@ -336,10 +336,6 @@ spec: - '2048' - --max-total-tokens - '4096' - - --max-batch-total-tokens - - '65536' - - --max-batch-prefill-tokens - - '4096' volumeMounts: - mountPath: /data name: model-volume