diff --git a/ggml-quants.c b/ggml-quants.c index 9cfd493b8d4720..dd2317e5dc2138 100644 --- a/ggml-quants.c +++ b/ggml-quants.c @@ -4596,18 +4596,18 @@ void ggml_vec_dot_q8_0_q8_0(int n, float * restrict s, size_t bs, const void * r #if defined(__ARM_FEATURE_MATMUL_INT8) if (nrc == 2) { - const block_q4_0 * restrict vx0 = vx; - const block_q4_0 * restrict vx1 = (const block_q4_0 *) ((const uint8_t*)vx + bx); + const block_q8_0 * restrict vx0 = vx; + const block_q8_0 * restrict vx1 = (const block_q8_0 *) ((const uint8_t*)vx + bx); const block_q8_0 * restrict vy0 = vy; const block_q8_0 * restrict vy1 = (const block_q8_0 *) ((const uint8_t*)vy + by); float32x4_t sumv0 = vdupq_n_f32(0.0f); for (int i = 0; i < nb; i++) { - const block_q4_0 * restrict b_x0 = &vx0[i]; + const block_q8_0 * restrict b_x0 = &vx0[i]; const block_q8_0 * restrict b_y0 = &vy0[i]; - const block_q4_0 * restrict b_x1 = &vx1[i]; + const block_q8_0 * restrict b_x1 = &vx1[i]; const block_q8_0 * restrict b_y1 = &vy1[i]; const int8x16_t x0_l = vld1q_s8((const int8_t*)b_x0->qs);