From 1f51f7f9d44dd03048eccbdc6ecb265b549ee2c6 Mon Sep 17 00:00:00 2001
From: Hansung Kim
Date: Sun, 8 Sep 2024 22:49:38 -0700
Subject: [PATCH] sgemm_impl: Mark threadblock_barrier convergent

Thank you Chris Lattner
---
 tests/regression/sgemm_tcore/sgemm_impl.hpp | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/tests/regression/sgemm_tcore/sgemm_impl.hpp b/tests/regression/sgemm_tcore/sgemm_impl.hpp
index 05692308..bf4ca80d 100644
--- a/tests/regression/sgemm_tcore/sgemm_impl.hpp
+++ b/tests/regression/sgemm_tcore/sgemm_impl.hpp
@@ -536,7 +536,8 @@ wmma_store(const int thread_in_warp, const int warp_col, const int warp_row,
   asm volatile ("wmma_store_finish_%=:" :: );
 }
 
-inline void threadblock_barrier(const uint32_t barrier_id, const uint32_t count) {
+__attribute__((convergent)) inline void
+threadblock_barrier(const uint32_t barrier_id, const uint32_t count) {
   vx_fence();
   vx_barrier(barrier_id, count);
 }