Skip to content

Commit

Permalink
Fix merge
Browse files (browse the repository at this point in the history)
---------

Co-authored-by: ardfork <134447697+ardfork@users.noreply.github.com>
Co-authored-by: Kerfuffle <44031344+KerfuffleV2@users.noreply.github.com>
  • Loading branch information
3 people authored and YellowRoseCx committed Aug 10, 2023
1 parent f570b5c commit 9dba0c9
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions ggml-cuda.cu
Original file line number Diff line number Diff line change
@@ -1641,8 +1641,8 @@ template <int vdr> static __device__ __forceinline__ float vec_dot_q8_1_q8_1_imp
#else
const float2 dm8f = __half22float2(dm8);
const float2 ds8f = __half22float2(ds8);
- const float d8d8 = dm8f.x * ds8f.x;
- const float m8s8 = dm8f.y * ds8f.y;
+ const float d8d8 = __low2float(dm8) * __low2float(ds8);
+ const float m8s8 = __high2float(dm8) * __high2float(ds8);
#endif // GGML_CUDA_F16

// scale second part of sum by QI8_1/ vdr to compensate for multiple threads adding it
@@ -3281,7 +3281,7 @@ static __global__ void mul_mat_q(
*dsi_dst = *dsi_src;
} else {
float * dfi_dst = (float *) dsi_dst;
- *dfi_dst = (*dsi_src).x;
+ *dfi_dst = __low2half(*dsi_src);
}
}

Expand Down

0 comments on commit 9dba0c9

Please sign in to comment.