From 9f067acdb9bc3fd088aa361dad0201a85a4c0f43 Mon Sep 17 00:00:00 2001 From: Hansung Kim Date: Thu, 5 Sep 2024 19:55:36 -0700 Subject: [PATCH] sgemm_impl: Remove #if 0, FP_SIZE 16 --- tests/regression/sgemm_tcore/sgemm_impl.hpp | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/tests/regression/sgemm_tcore/sgemm_impl.hpp b/tests/regression/sgemm_tcore/sgemm_impl.hpp index 2014b507..ac07a666 100644 --- a/tests/regression/sgemm_tcore/sgemm_impl.hpp +++ b/tests/regression/sgemm_tcore/sgemm_impl.hpp @@ -6,7 +6,7 @@ #include "include/gemmini.h" #include "gemmini_mmio.h" -#define FP_SIZE 32 +#define FP_SIZE 16 // "fake" fp16 type that only has the correct data width. using float16_t = uint16_t; @@ -1038,7 +1038,6 @@ inline void thread_block_gemm(const T *A, const T *B, float *C, warps_per_threadblock_per_core); #endif -#if 0 // consumer code: SMEM->RF and compute // ---------------------------------------------------------------------- // @perf: this loop spills to stack a lot because of all the flws in @@ -1087,7 +1086,6 @@ inline void thread_block_gemm(const T *A, const T *B, float *C, threadblock_barrier(threadblock_id_in_cluster, warps_per_threadblock_per_core); -#endif } if constexpr (write_to_gmem) {