From 30a4d15cde66a962b3071438b9214cc6e040f95d Mon Sep 17 00:00:00 2001
From: Hansung Kim
Date: Sun, 8 Sep 2024 15:29:15 -0700
Subject: [PATCH] sgemm_impl: Parameterize BM on NUM_CORES

---
 tests/regression/sgemm_tcore/sgemm_impl.hpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/regression/sgemm_tcore/sgemm_impl.hpp b/tests/regression/sgemm_tcore/sgemm_impl.hpp
index 7ba19992..d24c61d6 100644
--- a/tests/regression/sgemm_tcore/sgemm_impl.hpp
+++ b/tests/regression/sgemm_tcore/sgemm_impl.hpp
@@ -29,7 +29,7 @@ using float_type = float16_t;
 // (BM*BN) / (TM*TN) == threadblock size >= NT * CORES_PER_CLUSTER
 // * Combining BM * BK >= (BM*BN) / (TM*TN) == threadblock yields
 // BM <= BK*TM*TN
-#define BM 128
+#define BM ((NUM_CORES == 8) ? 128 : 64)
 #define BN 64
 #if (FP_SIZE == 32)
 #define BK 64