Skip to content

Commit

Permalink
ggml-cuda : use i and j instead of i0 and i in vec_dot_tq2_0_q8_1
Browse files (browse the repository at this point in the history)
  • Loading branch information
compilade committed Jan 12, 2025
1 parent b6fc9f0 commit fbddb26
Showing 1 changed file with 5 additions and 5 deletions.
10 changes: 5 additions & 5 deletions ggml/src/ggml-cuda/vecdotq.cuh
Original file line number Diff line number Diff line change
Expand Up @@ -831,13 +831,13 @@ static __device__ __forceinline__ float vec_dot_tq2_0_q8_1(
}

#pragma unroll
- for (int i0 = 0; i0 < QR2_0; ++i0) {
- const block_q8_1 * bq8i = bq8_1 + bq8_offset + i0;
+ for (int i = 0; i < QR2_0; ++i) {
+ const block_q8_1 * bq8i = bq8_1 + bq8_offset + i;

- for (int i = 0; i < VDR_TQ2_0_Q8_1_MMVQ; ++i) {
- u[VDR_TQ2_0_Q8_1_MMVQ*i0 + i] = get_int_b4(bq8i->qs, (iqs % QI8_1) + i);
+ for (int j = 0; j < VDR_TQ2_0_Q8_1_MMVQ; ++j) {
+ u[VDR_TQ2_0_Q8_1_MMVQ*i + j] = get_int_b4(bq8i->qs, (iqs % QI8_1) + j);
}
- d8[i0] = __low2float(bq8i->ds);
+ d8[i] = __low2float(bq8i->ds);
}

return vec_dot_tq2_0_q8_1_impl<VDR_TQ2_0_Q8_1_MMVQ>(v, u, btq2_0->d, d8);
Expand Down

0 comments on commit fbddb26

Please sign in to comment.