@@ -9921,6 +9921,8 @@ static void ggml_compute_forward_add(
9921
9921
case GGML_TYPE_Q4_K:
9922
9922
case GGML_TYPE_Q5_K:
9923
9923
case GGML_TYPE_Q6_K:
9924
+ case GGML_TYPE_TQ1_0:
9925
+ case GGML_TYPE_TQ2_0:
9924
9926
case GGML_TYPE_IQ2_XXS:
9925
9927
case GGML_TYPE_IQ2_XS:
9926
9928
case GGML_TYPE_IQ3_XXS:
@@ -10299,6 +10301,8 @@ static void ggml_compute_forward_add1(
10299
10301
case GGML_TYPE_Q4_K:
10300
10302
case GGML_TYPE_Q5_K:
10301
10303
case GGML_TYPE_Q6_K:
10304
+ case GGML_TYPE_TQ1_0:
10305
+ case GGML_TYPE_TQ2_0:
10302
10306
case GGML_TYPE_IQ2_XXS:
10303
10307
case GGML_TYPE_IQ2_XS:
10304
10308
case GGML_TYPE_IQ3_XXS:
@@ -10427,6 +10431,8 @@ static void ggml_compute_forward_acc(
10427
10431
case GGML_TYPE_Q4_K:
10428
10432
case GGML_TYPE_Q5_K:
10429
10433
case GGML_TYPE_Q6_K:
10434
+ case GGML_TYPE_TQ1_0:
10435
+ case GGML_TYPE_TQ2_0:
10430
10436
case GGML_TYPE_IQ2_XXS:
10431
10437
case GGML_TYPE_IQ2_XS:
10432
10438
case GGML_TYPE_IQ3_XXS:
@@ -10562,16 +10568,7 @@ static void ggml_compute_forward_mul_f32(
10562
10568
GGML_ASSERT( nb0 == sizeof(float));
10563
10569
GGML_ASSERT(nb00 == sizeof(float));
10564
10570
10565
- if (ggml_nelements(src1) == 1) {
10566
- float scale = ((float *) src1->data)[0];
10567
- for (int64_t ir = ith; ir < nr; ir += nth) {
10568
- if (dst->data != src0->data) {
10569
- // src0 is same shape as dst => same indices
10570
- memcpy((char *)dst->data + ir*nb1, (char *)src0->data + ir*nb01, ne0 * sizeof(float));
10571
- }
10572
- ggml_vec_scale_f32(ne0, (float *) ((char *) dst->data + ir*nb1), scale);
10573
- }
10574
- } else if (nb10 == sizeof(float)) {
10571
+ if (nb10 == sizeof(float)) {
10575
10572
for (int64_t ir = ith; ir < nr; ir += nth) {
10576
10573
// src0 and dst are same shape => same indices
10577
10574
const int64_t i03 = ir/(ne02*ne01);
@@ -13419,6 +13416,8 @@ static void ggml_compute_forward_out_prod(
13419
13416
case GGML_TYPE_Q4_K:
13420
13417
case GGML_TYPE_Q5_K:
13421
13418
case GGML_TYPE_Q6_K:
13419
+ case GGML_TYPE_TQ1_0:
13420
+ case GGML_TYPE_TQ2_0:
13422
13421
case GGML_TYPE_IQ2_XXS:
13423
13422
case GGML_TYPE_IQ2_XS:
13424
13423
case GGML_TYPE_IQ3_XXS:
@@ -13607,6 +13606,8 @@ static void ggml_compute_forward_set(
13607
13606
case GGML_TYPE_Q4_K:
13608
13607
case GGML_TYPE_Q5_K:
13609
13608
case GGML_TYPE_Q6_K:
13609
+ case GGML_TYPE_TQ1_0:
13610
+ case GGML_TYPE_TQ2_0:
13610
13611
case GGML_TYPE_IQ2_XXS:
13611
13612
case GGML_TYPE_IQ2_XS:
13612
13613
case GGML_TYPE_IQ3_XXS:
0 commit comments