We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 34b0a08 commit e77094f (Copy full SHA for e77094f)
ggml-cuda.cu
@@ -6251,6 +6251,8 @@ static int64_t get_row_rounding(ggml_type type) {
6251
return max_compute_capability >= CC_RDNA2 ? 128 : 64;
6252
case GGML_TYPE_F16:
6253
return 1;
6254
+ case GGML_TYPE_F32:
6255
+ return 1;
6256
case GGML_TYPE_Q2_K:
6257
return max_compute_capability >= CC_RDNA2 ? 128 : 32;
6258
case GGML_TYPE_Q3_K:
@@ -6273,6 +6275,8 @@ static int64_t get_row_rounding(ggml_type type) {
6273
6275
return 64;
6274
6276
6277
6278
6279
6280
6281
6282
case GGML_TYPE_Q4_K:
0 commit comments