Skip to content

Commit dc6ac9e

Browse files
authored
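Fix the operand constraints of the inline assembly in the x86_64 s/dGEMV_T and s/dGEMV_N kernels
Operands 0 and 1 need to be declared as read-write ("+r") output operands rather than input-only ("r") operands, i.e. tagged as both input and output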
1 parent 69edc5b commit dc6ac9e

File tree

4 files changed

+30
-30
lines changed

4 files changed

+30
-30
lines changed

kernel/x86_64/dgemv_n_4.c

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -111,9 +111,9 @@ static void dgemv_kernel_4x2( BLASLONG n, FLOAT **ap, FLOAT *x, FLOAT *y, FLOAT
111111
"jnz 1b \n\t"
112112

113113
:
114-
:
115-
"r" (i), // 0
116-
"r" (n), // 1
114+
"+r" (i), // 0
115+
"+r" (n) // 1
116+
:
117117
"r" (x), // 2
118118
"r" (y), // 3
119119
"r" (ap[0]), // 4
@@ -166,9 +166,9 @@ static void dgemv_kernel_4x1(BLASLONG n, FLOAT *ap, FLOAT *x, FLOAT *y, FLOAT *a
166166
"jnz 1b \n\t"
167167

168168
:
169+
"+r" (i), // 0
170+
"+r" (n) // 1
169171
:
170-
"r" (i), // 0
171-
"r" (n), // 1
172172
"r" (x), // 2
173173
"r" (y), // 3
174174
"r" (ap), // 4

kernel/x86_64/dgemv_t_4.c

Lines changed: 9 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -127,9 +127,9 @@ static void dgemv_kernel_4x2(BLASLONG n, FLOAT *ap0, FLOAT *ap1, FLOAT *x, FLOAT
127127
"movsd %%xmm11,8(%2) \n\t"
128128

129129
:
130-
:
131-
"r" (i), // 0
132-
"r" (n), // 1
130+
"+r" (i), // 0
131+
"+r" (n) // 1
132+
:
133133
"r" (y), // 2
134134
"r" (ap0), // 3
135135
"r" (ap1), // 4
@@ -195,9 +195,9 @@ static void dgemv_kernel_4x1(BLASLONG n, FLOAT *ap, FLOAT *x, FLOAT *y)
195195
"movsd %%xmm10, (%2) \n\t"
196196

197197
:
198-
:
199-
"r" (i), // 0
200-
"r" (n), // 1
198+
"+r" (i), // 0
199+
"+r" (n) // 1
200+
:
201201
"r" (y), // 2
202202
"r" (ap), // 3
203203
"r" (x) // 4
@@ -259,9 +259,9 @@ static void add_y(BLASLONG n, FLOAT da , FLOAT *src, FLOAT *dest, BLASLONG inc_d
259259
"jnz 1b \n\t"
260260

261261
:
262-
:
263-
"r" (i), // 0
264-
"r" (n), // 1
262+
"+r" (i), // 0
263+
"+r" (n) // 1
264+
:
265265
"r" (&da), // 2
266266
"r" (src), // 3
267267
"r" (dest) // 4

kernel/x86_64/sgemv_n_4.c

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -149,9 +149,9 @@ static void sgemv_kernel_4x2( BLASLONG n, FLOAT **ap, FLOAT *x, FLOAT *y, FLOAT
149149
"jnz 1b \n\t"
150150

151151
:
152-
:
153-
"r" (i), // 0
154-
"r" (n), // 1
152+
"+r" (i), // 0
153+
"+r" (n) // 1
154+
:
155155
"r" (x), // 2
156156
"r" (y), // 3
157157
"r" (ap[0]), // 4
@@ -223,9 +223,9 @@ static void sgemv_kernel_4x1(BLASLONG n, FLOAT *ap, FLOAT *x, FLOAT *y, FLOAT *a
223223

224224
"3: \n\t"
225225
:
226+
"+r" (i), // 0
227+
"+r" (n1) // 1
226228
:
227-
"r" (i), // 0
228-
"r" (n1), // 1
229229
"r" (x), // 2
230230
"r" (y), // 3
231231
"r" (ap), // 4
@@ -277,9 +277,9 @@ static void add_y(BLASLONG n, FLOAT *src, FLOAT *dest, BLASLONG inc_dest)
277277
"jnz 1b \n\t"
278278

279279
:
280+
"+r" (i), // 0
281+
"+r" (n) // 1
280282
:
281-
"r" (i), // 0
282-
"r" (n), // 1
283283
"r" (src), // 2
284284
"r" (dest) // 3
285285
: "cc",

kernel/x86_64/sgemv_t_4.c

Lines changed: 9 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -139,9 +139,9 @@ static void sgemv_kernel_4x2(BLASLONG n, FLOAT *ap0, FLOAT *ap1, FLOAT *x, FLOAT
139139
"movss %%xmm11,4(%2) \n\t"
140140

141141
:
142-
:
143-
"r" (i), // 0
144-
"r" (n), // 1
142+
"+r" (i), // 0
143+
"+r" (n) // 1
144+
:
145145
"r" (y), // 2
146146
"r" (ap0), // 3
147147
"r" (ap1), // 4
@@ -208,9 +208,9 @@ static void sgemv_kernel_4x1(BLASLONG n, FLOAT *ap, FLOAT *x, FLOAT *y)
208208
"movss %%xmm10, (%2) \n\t"
209209

210210
:
211-
:
212-
"r" (i), // 0
213-
"r" (n), // 1
211+
"+r" (i), // 0
212+
"+r" (n) // 1
213+
:
214214
"r" (y), // 2
215215
"r" (ap), // 3
216216
"r" (x) // 4
@@ -272,9 +272,9 @@ static void add_y(BLASLONG n, FLOAT da , FLOAT *src, FLOAT *dest, BLASLONG inc_d
272272
"jnz 1b \n\t"
273273

274274
:
275-
:
276-
"r" (i), // 0
277-
"r" (n), // 1
275+
"+r" (i), // 0
276+
"+r" (n) // 1
277+
:
278278
"r" (&da), // 2
279279
"r" (src), // 3
280280
"r" (dest) // 4

0 commit comments

Comments
 (0)