1 file changed: 3 additions (+3), 3 deletions (-3).
Columns: original file line number, diff line number, diff line change.
@@ -1641,8 +1641,8 @@ template <int vdr> static __device__ __forceinline__ float vec_dot_q8_1_q8_1_imp
1641
1641
#else
1642
1642
const float2 dm8f = __half22float2 (dm8);
1643
1643
const float2 ds8f = __half22float2 (ds8);
1644
- const float d8d8 = dm8f. x * ds8f. x ;
1645
- const float m8s8 = dm8f. y * ds8f. y ;
1644
+ const float d8d8 = __low2float (dm8) * __low2float (ds8) ;
1645
+ const float m8s8 = __high2float (dm8) * __high2float (ds8) ;
1646
1646
#endif // GGML_CUDA_F16
1647
1647
1648
1648
// scale second part of sum by QI8_1 / vdr to compensate for multiple threads adding it
@@ -3281,7 +3281,7 @@ static __global__ void mul_mat_q(
3281
3281
*dsi_dst = *dsi_src;
3282
3282
} else {
3283
3283
float * dfi_dst = (float *) dsi_dst;
3284
- *dfi_dst = (*dsi_src). x ;
3284
+ *dfi_dst = __low2half (*dsi_src);
3285
3285
}
3286
3286
}
3287
3287
You can’t perform that action at this time.
0 commit comments