Skip to content

Commit b12acc6

Browse files
committed
Merge remote-tracking branch 'quarticcat/master' into master2
# Conflicts:
#	exllama_ext/cuda_func/q4_matmul.cu
2 parents 93dbb26 + 8e37f2d commit b12acc6

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

exllama_ext/cuda_func/q4_matmul.cu

+2-2
Original file line number | Diff line number | Diff line change
@@ -8,10 +8,10 @@
 #include "../hip_compat.cuh"
 #endif
 
-const int THREADS_X = 128; // Block size and thread count along columns in w and out
+const int THREADS_X = 32; // Block size and thread count along columns in w and out
 const int THREADS_Y = 1; // Block size and thread count along rows in x and out
 
-const int GROUP_STEP = 128; // Assumed group size when block_size_z % groupsize != 0
+const int GROUP_STEP = 32; // Assumed group size when block_size_z % groupsize != 0
 
 typedef void (*fp_q4_matmul_kernel)
 (

0 commit comments

Comments
 (0)