Skip to content

Commit 8c32b08

Browse files
authored
[Kernel] Fix awq error when n is not divisible by 128 (#13227)
1 parent 4108869 commit 8c32b08

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

csrc/quantization/awq/gemm_kernels.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -334,7 +334,7 @@ __global__ void __launch_bounds__(64)
334334
}
335335

336336
// TODO: Shang: Hoist loop invariance.
337-
for (int ax1_0_1 = 0; ax1_0_1 < 4; ++ax1_0_1) {
337+
for (int ax1_0_1 = 0; ax1_0_1 < (N / 32); ++ax1_0_1) {
338338
for (int local_id = 0; local_id < 8; ++local_id) {
339339
int row_offset = (((int)blockIdx_y) / j_factors1) * 16 +
340340
((int)threadIdx.x) / 4 + (local_id % 4) / 2 * 8;

0 commit comments

Comments
 (0)