Skip to content

Commit e238a68

Browse files
committed
Remove duplicate: drop vec_loadNHi_mult2 and call the equivalent vec_loadNHi_mult instead.
1 parent 32095b0 commit e238a68

File tree

2 files changed

+15
-22
lines changed

2 files changed

+15
-22
lines changed

kernel/power/sbgemv_common.c

Lines changed: 0 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -111,13 +111,6 @@ FORCEINLINE vec_f32 vec_loadNHi_mult(vec_bf16 *in, vec_f32 v_inp0, BLASLONG n, v
111111
return (v_inp0 * v_in00);
112112
}
113113

114-
FORCEINLINE vec_f32 vec_loadNHi_mult2(vec_f32 v_x0, vec_bf16 *in, BLASLONG n, vec_bf16 zero)
115-
{
116-
vec_f32 v_in00 = vec_loadNHi(in, n, zero);
117-
118-
return (v_x0 * v_in00);
119-
}
120-
121114
FORCEINLINE vec_f32 vec_loadNHi_vec(vec_bf16 *in, BLASLONG i, BLASLONG n, vec_bf16 zero)
122115
{
123116
return vec_loadNHi(&in[i], n, zero);

kernel/power/sbgemv_n_vsx.c

Lines changed: 15 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -80,7 +80,7 @@ static void BF16GEMV_N_VSX_1(BLASLONG n, IFLOAT **ap, IFLOAT *xo, FLOAT *y, FLOA
8080
} else if (n) {
8181
vy0[0] = vec_loadN_f32(&v_y[(i * 2) + 0], n);
8282

83-
vy0[0] += vec_loadNHi_mult2(v_x0, &va0[i], n, zero);
83+
vy0[0] += vec_loadNHi_mult(&va0[i], v_x0, n, zero);
8484

8585
vec_storeN_f32(vy0[0], &v_y[(i * 2) + 0], n);
8686
}
@@ -131,8 +131,8 @@ static void BF16GEMV_N_VSX_2(BLASLONG n, IFLOAT **ap, IFLOAT *xo, FLOAT *y, FLOA
131131
} else if (n) {
132132
vy0[0] = vec_loadN_f32(&v_y[(i * 2) + 0], n);
133133

134-
vy0[0] += vec_loadNHi_mult2(v_x0, &va0[i], n, zero);
135-
vy0[0] += vec_loadNHi_mult2(v_x1, &va1[i], n, zero);
134+
vy0[0] += vec_loadNHi_mult(&va0[i], v_x0, n, zero);
135+
vy0[0] += vec_loadNHi_mult(&va1[i], v_x1, n, zero);
136136

137137
vec_storeN_f32(vy0[0], &v_y[(i * 2) + 0], n);
138138
}
@@ -193,10 +193,10 @@ static void BF16GEMV_N_VSX_4(BLASLONG n, IFLOAT **ap, IFLOAT *xo, FLOAT *y, FLOA
193193
} else if (n) {
194194
vy0[0] = vec_loadN_f32(&v_y[(i * 2) + 0], n);
195195

196-
vy0[0] += vec_loadNHi_mult2(v_x0, &va0[i], n, zero);
197-
vy0[0] += vec_loadNHi_mult2(v_x1, &va1[i], n, zero);
198-
vy0[0] += vec_loadNHi_mult2(v_x2, &va2[i], n, zero);
199-
vy0[0] += vec_loadNHi_mult2(v_x3, &va3[i], n, zero);
196+
vy0[0] += vec_loadNHi_mult(&va0[i], v_x0, n, zero);
197+
vy0[0] += vec_loadNHi_mult(&va1[i], v_x1, n, zero);
198+
vy0[0] += vec_loadNHi_mult(&va2[i], v_x2, n, zero);
199+
vy0[0] += vec_loadNHi_mult(&va3[i], v_x3, n, zero);
200200

201201
vec_storeN_f32(vy0[0], &v_y[(i * 2) + 0], n);
202202
}
@@ -281,14 +281,14 @@ static void BF16GEMV_N_VSX_8(BLASLONG n, IFLOAT **ap, IFLOAT *xo, FLOAT *y, BLAS
281281
} else if (n) {
282282
vy0[0] = vec_loadN_f32(&v_y[(i * 2) + 0], n);
283283

284-
vy0[0] += vec_loadNHi_mult2(v_x0, &va0[i], n, zero);
285-
vy0[0] += vec_loadNHi_mult2(v_x1, &va1[i], n, zero);
286-
vy0[0] += vec_loadNHi_mult2(v_x2, &va2[i], n, zero);
287-
vy0[0] += vec_loadNHi_mult2(v_x3, &va3[i], n, zero);
288-
vy0[0] += vec_loadNHi_mult2(v_x4, &vb0[i], n, zero);
289-
vy0[0] += vec_loadNHi_mult2(v_x5, &vb1[i], n, zero);
290-
vy0[0] += vec_loadNHi_mult2(v_x6, &vb2[i], n, zero);
291-
vy0[0] += vec_loadNHi_mult2(v_x7, &vb3[i], n, zero);
284+
vy0[0] += vec_loadNHi_mult(&va0[i], v_x0, n, zero);
285+
vy0[0] += vec_loadNHi_mult(&va1[i], v_x1, n, zero);
286+
vy0[0] += vec_loadNHi_mult(&va2[i], v_x2, n, zero);
287+
vy0[0] += vec_loadNHi_mult(&va3[i], v_x3, n, zero);
288+
vy0[0] += vec_loadNHi_mult(&vb0[i], v_x4, n, zero);
289+
vy0[0] += vec_loadNHi_mult(&vb1[i], v_x5, n, zero);
290+
vy0[0] += vec_loadNHi_mult(&vb2[i], v_x6, n, zero);
291+
vy0[0] += vec_loadNHi_mult(&vb3[i], v_x7, n, zero);
292292

293293
vec_storeN_f32(vy0[0], &v_y[(i * 2) + 0], n);
294294
}

0 commit comments

Comments
 (0)