Skip to content

Commit 32095b0

Browse files
committed
Remove parameter.
1 parent c878820 commit 32095b0

File tree

2 files changed

+21
-21
lines changed

2 files changed

+21
-21
lines changed

kernel/power/sbgemv_common.c

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -58,9 +58,9 @@ FORCEINLINE vec_f32 vec_load_mult(vec_bf16 *in, vec_f32 *inp, vec_bf16 zero)
5858
return vec_mult(inp, in0, zero);
5959
}
6060

61-
FORCEINLINE void vec_load_vec2(vec_bf16 *in, BLASLONG i, vec_f32 *v_x0, vec_bf16 zero)
61+
FORCEINLINE void vec_load_vec2(vec_bf16 *in, vec_f32 *v_x0, vec_bf16 zero)
6262
{
63-
vec_bf16 inp = (vec_bf16)vec_load_vec(&in[i]);
63+
vec_bf16 inp = (vec_bf16)vec_load_vec(in);
6464

6565
v_x0[0] = BF16_HI(inp, zero);
6666
v_x0[1] = BF16_LO(inp, zero);
@@ -89,9 +89,9 @@ FORCEINLINE vec_f32 vec_loadN_mult(vec_bf16 *in, vec_f32 *inp, BLASLONG n, vec_b
8989
return vec_mult(inp, in0, zero);
9090
}
9191

92-
FORCEINLINE void vec_loadN_vec2(vec_bf16 *in, BLASLONG i, vec_f32 *v_x0, BLASLONG n, vec_bf16 zero)
92+
FORCEINLINE void vec_loadN_vec2(vec_bf16 *in, vec_f32 *v_x0, BLASLONG n, vec_bf16 zero)
9393
{
94-
vec_bf16 inp = vec_loadN(&in[i], n);
94+
vec_bf16 inp = vec_loadN(in, n);
9595

9696
v_x0[0] = BF16_HI(inp, zero);
9797
v_x0[1] = BF16_LO(inp, zero);

kernel/power/sbgemv_t_vsx.c

Lines changed: 17 additions & 17 deletions
Original file line number | Diff line number | Diff line change
@@ -55,14 +55,14 @@ static void BF16GEMV_T_VSX_1(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL
5555
BLASLONG i = 0;
5656

5757
for (; i < n8; i++) {
58-
vec_load_vec2(v_x, i, inp, zero);
58+
vec_load_vec2(&v_x[i], inp, zero);
5959

6060
temp0 += vec_load_mult(&va0[i], inp, zero);
6161
}
6262

6363
n &= 7;
6464
if (n > 4) {
65-
vec_loadN_vec2(v_x, i, inp, n, zero);
65+
vec_loadN_vec2(&v_x[i], inp, n, zero);
6666

6767
temp0 += vec_loadN_mult(&va0[i], inp, n, zero);
6868
} else if (n) {
@@ -92,15 +92,15 @@ static void BF16GEMV_T_VSX_2(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL
9292
BLASLONG i = 0;
9393

9494
for (; i < n8; i++) {
95-
vec_load_vec2(v_x, i, inp, zero);
95+
vec_load_vec2(&v_x[i], inp, zero);
9696

9797
temp0 += vec_load_mult(&va0[i], inp, zero);
9898
temp1 += vec_load_mult(&va1[i], inp, zero);
9999
}
100100

101101
n &= 7;
102102
if (n > 4) {
103-
vec_loadN_vec2(v_x, i, inp, n, zero);
103+
vec_loadN_vec2(&v_x[i], inp, n, zero);
104104

105105
temp0 += vec_loadN_mult(&va0[i], inp, n, zero);
106106
temp1 += vec_loadN_mult(&va1[i], inp, n, zero);
@@ -139,7 +139,7 @@ static void BF16GEMV_T_VSX_4(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL
139139
BLASLONG i = 0;
140140

141141
for (; i < n8; i++) {
142-
vec_load_vec2(v_x, i, inp, zero);
142+
vec_load_vec2(&v_x[i], inp, zero);
143143

144144
temp0 += vec_load_mult(&va0[i], inp, zero);
145145
temp1 += vec_load_mult(&va1[i], inp, zero);
@@ -149,7 +149,7 @@ static void BF16GEMV_T_VSX_4(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL
149149

150150
n &= 7;
151151
if (n > 4) {
152-
vec_loadN_vec2(v_x, i, inp, n, zero);
152+
vec_loadN_vec2(&v_x[i], inp, n, zero);
153153

154154
temp0 += vec_loadN_mult(&va0[i], inp, n, zero);
155155
temp1 += vec_loadN_mult(&va1[i], inp, n, zero);
@@ -220,7 +220,7 @@ static void BF16GEMV_T_VSX_8(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL
220220
BLASLONG i = 0;
221221

222222
for (; i < n8; i++) {
223-
vec_load_vec2(v_x, i, inp, zero);
223+
vec_load_vec2(&v_x[i], inp, zero);
224224

225225
temp0 += vec_load_mult(&va0[i], inp, zero);
226226
temp1 += vec_load_mult(&va1[i], inp, zero);
@@ -234,7 +234,7 @@ static void BF16GEMV_T_VSX_8(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL
234234

235235
n &= 7;
236236
if (n > 4) {
237-
vec_loadN_vec2(v_x, i, inp, n, zero);
237+
vec_loadN_vec2(&v_x[i], inp, n, zero);
238238

239239
temp0 += vec_loadN_mult(&va0[i], inp, n, zero);
240240
temp1 += vec_loadN_mult(&va1[i], inp, n, zero);
@@ -257,7 +257,7 @@ static void BF16GEMV_T_VSX_8(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL
257257
temp7 += vec_loadNHi_mult(&va7[i], inp[0], n, zero);
258258
}
259259

260-
vec_f32 t0, t1, t2, t3;
260+
vec_f32 t0, t1, t2, t3, t10, t11, t12, t13;
261261
vec_f32 a = { alpha, alpha, alpha, alpha };
262262
vec_f32 b = { beta, beta, beta, beta };
263263
vec_f32 *v_y = (vec_f32 *) y;
@@ -272,14 +272,14 @@ static void BF16GEMV_T_VSX_8(BLASLONG n, BLASLONG lda, IFLOAT *ap, IFLOAT *x, FL
272272
temp3 = vec_mergel(t1, t3);
273273
temp0 += temp1 + temp2 + temp3;
274274

275-
t0 = vec_mergeh(temp4, temp6);
276-
t1 = vec_mergel(temp4, temp6);
277-
t2 = vec_mergeh(temp5, temp7);
278-
t3 = vec_mergel(temp5, temp7);
279-
temp4 = vec_mergeh(t0, t2);
280-
temp5 = vec_mergel(t0, t2);
281-
temp6 = vec_mergeh(t1, t3);
282-
temp7 = vec_mergel(t1, t3);
275+
t10 = vec_mergeh(temp4, temp6);
276+
t11 = vec_mergel(temp4, temp6);
277+
t12 = vec_mergeh(temp5, temp7);
278+
t13 = vec_mergel(temp5, temp7);
279+
temp4 = vec_mergeh(t10, t12);
280+
temp5 = vec_mergel(t10, t12);
281+
temp6 = vec_mergeh(t11, t13);
282+
temp7 = vec_mergel(t11, t13);
283283
temp4 += temp5 + temp6 + temp7;
284284

285285
vec_load_pair(inp, v_y);

0 commit comments

Comments
 (0)