From 53093d1a0e049b32c142bd6f8aa4932b53609a56 Mon Sep 17 00:00:00 2001
From: Mahesh Doijade
Date: Wed, 30 Nov 2022 22:12:10 +0530
Subject: [PATCH] switch mma instruction shape to 1684 from current 1688, as it is always faster than 1688

---
 cpp/include/raft/distance/detail/pairwise_distance_gemm.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cpp/include/raft/distance/detail/pairwise_distance_gemm.h b/cpp/include/raft/distance/detail/pairwise_distance_gemm.h
index ea9ed77fb5..8dcccfc14f 100644
--- a/cpp/include/raft/distance/detail/pairwise_distance_gemm.h
+++ b/cpp/include/raft/distance/detail/pairwise_distance_gemm.h
@@ -66,7 +66,7 @@ struct PairwiseDistanceGemm {
   /// Warp-level tile size (concept: GemmShape)
   // This code section describes the size of MMA op
   using InstructionShape =
-    cutlass::gemm::GemmShape<16, 8, 8>;  // <- MMA Op tile M = 16, N = 8, K = 8
+    cutlass::gemm::GemmShape<16, 8, 4>;  // <- MMA Op tile M = 16, N = 8, K = 4
 
   /// Operation performed by GEMM
   using Operator = cutlass::arch::OpMultiplyAddFastF32;