Skip to content

Commit f6ffeb5

Browse files
committed
Fix issues with SSE3 version for vec_dot_q4_0_b16_q8_0_b16
1 parent 7912cb6 commit f6ffeb5

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ggml/src/ggml-quants.c

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4486,7 +4486,7 @@ void ggml_vec_dot_q4_0_b16_q8_0_b16(int n, float * restrict s, size_t bs, const
4486 4486
_mm_prefetch(&y[0] + sizeof(block_q8_0), _MM_HINT_T0);
4487 4487

4488 4488
// Compute combined scale for the block 0 and 1
4489-
const __m128 d_0_1 = _mm_set1_ps( GGML_BF16_TO_FP32(ggml_make_bf16(x[i].d)) * GGML_BF16_TO_FP32(ggml_make_bf16(y[i].d)));
4489+
const __m128 d_0_1 = _mm_set1_ps( GGML_BF16_TO_FP32(ggml_make_bf16(x[0].d)) * GGML_BF16_TO_FP32(ggml_make_bf16(y[0].d)));
4490 4490

4491 4491
const __m128i tmp_0_1 = _mm_loadu_si128((const __m128i *)x[0].qs);
4492 4492

0 commit comments

Comments (0)