Skip to content

Commit 05a6f19

Browse files
authored
Fix loadSmemB iteration.
1 parent 5e59143 commit 05a6f19

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

examples/matmul/this-sm80/matmul-v00.cu

+2 -2
Original file line numberDiff line numberDiff line change
@@ -43,7 +43,7 @@ __device__ void loadSmemB(half *smem, half *B, int N, int K, int ko)
 int ty = threadIdx.y;
 int tz = threadIdx.z;
 int tid = tz * 64 + ty * 32 + tx;
-for (int i = 0; i < 64; ++i)
+for (int i = 0; i < 32; ++i)
 {
 int row = i * 4 + tid / 32;
 int col = tid % 32;
@@ -175,4 +175,4 @@ __global__ void matmul(half *A, half *B, half *C, int M, int N, int K, float alp
 storeAccum(SC, Accum);
 __syncthreads();
 storeSmemC(C, SC, M, N);
-}
+}

0 commit comments

Comments
 (0)