minor update

This commit is contained in:
Blaise Tine
2023-11-27 02:04:22 -08:00
parent 11752b2562
commit 2f1171ca76
3 changed files with 44 additions and 41 deletions

View File

@@ -28,6 +28,9 @@ __kernel void matmul(__global float *A,
for (int j = 0; j < localSize; j++) {
sum += localA[localRow * localSize + j] * localB[j * localSize + localCol];
}
// Wait until every work-item in the group has finished reading localA/localB before the next block overwrites them
barrier(CLK_LOCAL_MEM_FENCE);
}
C[globalRow * N + globalCol] = sum;