tensor: Add ready signal to enforce 1 warp occupancy

Currently disabled as the timing behavior is already ~accurate
This commit is contained in:
Hansung Kim
2024-05-16 12:49:15 -07:00
parent 1a1094b2bb
commit 89e7d65926
4 changed files with 28 additions and 5 deletions

View File

@@ -347,7 +347,7 @@ void dpi_fmax(bool enable, int dst_fmt, int64_t a, int64_t b, int64_t* result, s
// A is M * K, B is K * M, C is M * M, D is M * M
#define M 4
#define K 2
#define K 2 // FIXME: 4x4x1 / cycle / octet!
// all row major
float c_A_tile[M][K];
@@ -551,7 +551,7 @@ void dpi_print_results(int wid, int octet, const svBitVecVal* A_tile, const svBi
}
steps[wid] += 1;
if (steps[wid] % 64 == 0) {
if (steps[wid] % 32 == 0) {
steps[wid] = 0;
std::cout << "warp " << wid << " finished wmma\n";
std::cout << "A tile" << "\n";