Skip to content

Commit 7039770

Browse files
authored
[ZARCH] Undo the last commit
1 parent 11a43e8 commit 7039770

28 files changed: 987 additions (+987) and 987 deletions (-987).

kernel/zarch/damax.c

Lines changed: 17 additions & 17 deletions
Original file line number | Diff line number | Diff line change
@@ -33,27 +33,27 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
3333
static FLOAT damax_kernel_32(BLASLONG n, FLOAT *x) {
3434
FLOAT amax;
3535

36-
__asm__("vl %%v0,0(%[x]),3\n\t"
36+
__asm__("vl %%v0,0(%[x])\n\t"
3737
"srlg %[n],%[n],5\n\t"
3838
"xgr %%r1,%%r1\n\t"
3939
"0:\n\t"
4040
"pfd 1, 1024(%%r1,%[x])\n\t"
41-
"vl %%v16,0(%%r1,%[x]),3\n\t"
42-
"vl %%v17,16(%%r1,%[x]),3\n\t"
43-
"vl %%v18,32(%%r1,%[x]),3\n\t"
44-
"vl %%v19,48(%%r1,%[x]),3\n\t"
45-
"vl %%v20,64(%%r1,%[x]),3\n\t"
46-
"vl %%v21,80(%%r1,%[x]),3\n\t"
47-
"vl %%v22,96(%%r1,%[x]),3\n\t"
48-
"vl %%v23,112(%%r1,%[x]),3\n\t"
49-
"vl %%v24,128(%%r1,%[x]),3\n\t"
50-
"vl %%v25,144(%%r1,%[x]),3\n\t"
51-
"vl %%v26,160(%%r1,%[x]),3\n\t"
52-
"vl %%v27,176(%%r1,%[x]),3\n\t"
53-
"vl %%v28,192(%%r1,%[x]),3\n\t"
54-
"vl %%v29,208(%%r1,%[x]),3\n\t"
55-
"vl %%v30,224(%%r1,%[x]),3\n\t"
56-
"vl %%v31,240(%%r1,%[x]),3\n\t"
41+
"vl %%v16,0(%%r1,%[x])\n\t"
42+
"vl %%v17,16(%%r1,%[x])\n\t"
43+
"vl %%v18,32(%%r1,%[x])\n\t"
44+
"vl %%v19,48(%%r1,%[x])\n\t"
45+
"vl %%v20,64(%%r1,%[x])\n\t"
46+
"vl %%v21,80(%%r1,%[x])\n\t"
47+
"vl %%v22,96(%%r1,%[x])\n\t"
48+
"vl %%v23,112(%%r1,%[x])\n\t"
49+
"vl %%v24,128(%%r1,%[x])\n\t"
50+
"vl %%v25,144(%%r1,%[x])\n\t"
51+
"vl %%v26,160(%%r1,%[x])\n\t"
52+
"vl %%v27,176(%%r1,%[x])\n\t"
53+
"vl %%v28,192(%%r1,%[x])\n\t"
54+
"vl %%v29,208(%%r1,%[x])\n\t"
55+
"vl %%v30,224(%%r1,%[x])\n\t"
56+
"vl %%v31,240(%%r1,%[x])\n\t"
5757
"vfmaxdb %%v16,%%v16,%%v24,8\n\t"
5858
"vfmaxdb %%v17,%%v17,%%v25,8\n\t"
5959
"vfmaxdb %%v18,%%v18,%%v26,8\n\t"

kernel/zarch/damax_z13.c

Lines changed: 17 additions & 17 deletions
Original file line number | Diff line number | Diff line change
@@ -33,20 +33,20 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
3333
static FLOAT damax_kernel_32(BLASLONG n, FLOAT *x) {
3434
FLOAT amax;
3535

36-
__asm__("vl %%v0,0(%[x]),3\n\t"
36+
__asm__("vl %%v0,0(%[x])\n\t"
3737
"vflpdb %%v0,%%v0\n\t"
3838
"srlg %[n],%[n],5\n\t"
3939
"xgr %%r1,%%r1\n\t"
4040
"0:\n\t"
4141
"pfd 1, 1024(%%r1,%[x])\n\t"
42-
"vl %%v16,0(%%r1,%[x]),3\n\t"
43-
"vl %%v17,16(%%r1,%[x]),3\n\t"
44-
"vl %%v18,32(%%r1,%[x]),3\n\t"
45-
"vl %%v19,48(%%r1,%[x]),3\n\t"
46-
"vl %%v20,64(%%r1,%[x]),3\n\t"
47-
"vl %%v21,80(%%r1,%[x]),3\n\t"
48-
"vl %%v22,96(%%r1,%[x]),3\n\t"
49-
"vl %%v23,112(%%r1,%[x]),3\n\t"
42+
"vl %%v16,0(%%r1,%[x])\n\t"
43+
"vl %%v17,16(%%r1,%[x])\n\t"
44+
"vl %%v18,32(%%r1,%[x])\n\t"
45+
"vl %%v19,48(%%r1,%[x])\n\t"
46+
"vl %%v20,64(%%r1,%[x])\n\t"
47+
"vl %%v21,80(%%r1,%[x])\n\t"
48+
"vl %%v22,96(%%r1,%[x])\n\t"
49+
"vl %%v23,112(%%r1,%[x])\n\t"
5050
"vflpdb %%v16, %%v16\n\t"
5151
"vflpdb %%v17, %%v17\n\t"
5252
"vflpdb %%v18, %%v18\n\t"
@@ -71,14 +71,14 @@ static FLOAT damax_kernel_32(BLASLONG n, FLOAT *x) {
7171
"vsel %%v30,%%v28,%%v29,%%v30\n\t"
7272
"vfchdb %%v31,%%v30,%%v0\n\t"
7373
"vsel %%v0,%%v30,%%v0,%%v31\n\t"
74-
"vl %%v16,128(%%r1,%[x]),3\n\t"
75-
"vl %%v17,144(%%r1,%[x]),3\n\t"
76-
"vl %%v18,160(%%r1,%[x]),3\n\t"
77-
"vl %%v19,176(%%r1,%[x]),3\n\t"
78-
"vl %%v20,192(%%r1,%[x]),3\n\t"
79-
"vl %%v21,208(%%r1,%[x]),3\n\t"
80-
"vl %%v22,224(%%r1,%[x]),3\n\t"
81-
"vl %%v23,240(%%r1,%[x]),3\n\t"
74+
"vl %%v16,128(%%r1,%[x])\n\t"
75+
"vl %%v17,144(%%r1,%[x])\n\t"
76+
"vl %%v18,160(%%r1,%[x])\n\t"
77+
"vl %%v19,176(%%r1,%[x])\n\t"
78+
"vl %%v20,192(%%r1,%[x])\n\t"
79+
"vl %%v21,208(%%r1,%[x])\n\t"
80+
"vl %%v22,224(%%r1,%[x])\n\t"
81+
"vl %%v23,240(%%r1,%[x])\n\t"
8282
"vflpdb %%v16, %%v16\n\t"
8383
"vflpdb %%v17, %%v17\n\t"
8484
"vflpdb %%v18, %%v18\n\t"

kernel/zarch/damin.c

Lines changed: 17 additions & 17 deletions
Original file line number | Diff line number | Diff line change
@@ -33,27 +33,27 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
3333
static FLOAT damin_kernel_32(BLASLONG n, FLOAT *x) {
3434
FLOAT amin;
3535

36-
__asm__("vl %%v0,0(%[x]),3\n\t"
36+
__asm__("vl %%v0,0(%[x])\n\t"
3737
"srlg %[n],%[n],5\n\t"
3838
"xgr %%r1,%%r1\n\t"
3939
"0:\n\t"
4040
"pfd 1, 1024(%%r1,%[x])\n\t"
41-
"vl %%v16,0(%%r1,%[x]),3\n\t"
42-
"vl %%v17,16(%%r1,%[x]),3\n\t"
43-
"vl %%v18,32(%%r1,%[x]),3\n\t"
44-
"vl %%v19,48(%%r1,%[x]),3\n\t"
45-
"vl %%v20,64(%%r1,%[x]),3\n\t"
46-
"vl %%v21,80(%%r1,%[x]),3\n\t"
47-
"vl %%v22,96(%%r1,%[x]),3\n\t"
48-
"vl %%v23,112(%%r1,%[x]),3\n\t"
49-
"vl %%v24,128(%%r1,%[x]),3\n\t"
50-
"vl %%v25,144(%%r1,%[x]),3\n\t"
51-
"vl %%v26,160(%%r1,%[x]),3\n\t"
52-
"vl %%v27,176(%%r1,%[x]),3\n\t"
53-
"vl %%v28,192(%%r1,%[x]),3\n\t"
54-
"vl %%v29,208(%%r1,%[x]),3\n\t"
55-
"vl %%v30,224(%%r1,%[x]),3\n\t"
56-
"vl %%v31,240(%%r1,%[x]),3\n\t"
41+
"vl %%v16,0(%%r1,%[x])\n\t"
42+
"vl %%v17,16(%%r1,%[x])\n\t"
43+
"vl %%v18,32(%%r1,%[x])\n\t"
44+
"vl %%v19,48(%%r1,%[x])\n\t"
45+
"vl %%v20,64(%%r1,%[x])\n\t"
46+
"vl %%v21,80(%%r1,%[x])\n\t"
47+
"vl %%v22,96(%%r1,%[x])\n\t"
48+
"vl %%v23,112(%%r1,%[x])\n\t"
49+
"vl %%v24,128(%%r1,%[x])\n\t"
50+
"vl %%v25,144(%%r1,%[x])\n\t"
51+
"vl %%v26,160(%%r1,%[x])\n\t"
52+
"vl %%v27,176(%%r1,%[x])\n\t"
53+
"vl %%v28,192(%%r1,%[x])\n\t"
54+
"vl %%v29,208(%%r1,%[x])\n\t"
55+
"vl %%v30,224(%%r1,%[x])\n\t"
56+
"vl %%v31,240(%%r1,%[x])\n\t"
5757
"vfmindb %%v16,%%v16,%%v24,8\n\t"
5858
"vfmindb %%v17,%%v17,%%v25,8\n\t"
5959
"vfmindb %%v18,%%v18,%%v26,8\n\t"

kernel/zarch/damin_z13.c

Lines changed: 17 additions & 17 deletions
Original file line number | Diff line number | Diff line change
@@ -33,20 +33,20 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
3333
static FLOAT damin_kernel_32(BLASLONG n, FLOAT *x) {
3434
FLOAT amin;
3535

36-
__asm__("vl %%v0,0(%[x]),3\n\t"
36+
__asm__("vl %%v0,0(%[x])\n\t"
3737
"vflpdb %%v0,%%v0\n\t"
3838
"srlg %[n],%[n],5\n\t"
3939
"xgr %%r1,%%r1\n\t"
4040
"0:\n\t"
4141
"pfd 1, 1024(%%r1,%[x])\n\t"
42-
"vl %%v16,0(%%r1,%[x]),3\n\t"
43-
"vl %%v17,16(%%r1,%[x]),3\n\t"
44-
"vl %%v18,32(%%r1,%[x]),3\n\t"
45-
"vl %%v19,48(%%r1,%[x]),3\n\t"
46-
"vl %%v20,64(%%r1,%[x]),3\n\t"
47-
"vl %%v21,80(%%r1,%[x]),3\n\t"
48-
"vl %%v22,96(%%r1,%[x]),3\n\t"
49-
"vl %%v23,112(%%r1,%[x]),3\n\t"
42+
"vl %%v16,0(%%r1,%[x])\n\t"
43+
"vl %%v17,16(%%r1,%[x])\n\t"
44+
"vl %%v18,32(%%r1,%[x])\n\t"
45+
"vl %%v19,48(%%r1,%[x])\n\t"
46+
"vl %%v20,64(%%r1,%[x])\n\t"
47+
"vl %%v21,80(%%r1,%[x])\n\t"
48+
"vl %%v22,96(%%r1,%[x])\n\t"
49+
"vl %%v23,112(%%r1,%[x])\n\t"
5050
"vflpdb %%v16, %%v16\n\t"
5151
"vflpdb %%v17, %%v17\n\t"
5252
"vflpdb %%v18, %%v18\n\t"
@@ -71,14 +71,14 @@ static FLOAT damin_kernel_32(BLASLONG n, FLOAT *x) {
7171
"vsel %%v30,%%v28,%%v29,%%v30\n\t"
7272
"vfchdb %%v31,%%v0,%%v30\n\t"
7373
"vsel %%v0,%%v30,%%v0,%%v31\n\t"
74-
"vl %%v16,128(%%r1,%[x]),3\n\t"
75-
"vl %%v17,144(%%r1,%[x]),3\n\t"
76-
"vl %%v18,160(%%r1,%[x]),3\n\t"
77-
"vl %%v19,176(%%r1,%[x]),3\n\t"
78-
"vl %%v20,192(%%r1,%[x]),3\n\t"
79-
"vl %%v21,208(%%r1,%[x]),3\n\t"
80-
"vl %%v22,224(%%r1,%[x]),3\n\t"
81-
"vl %%v23,240(%%r1,%[x]),3\n\t"
74+
"vl %%v16,128(%%r1,%[x])\n\t"
75+
"vl %%v17,144(%%r1,%[x])\n\t"
76+
"vl %%v18,160(%%r1,%[x])\n\t"
77+
"vl %%v19,176(%%r1,%[x])\n\t"
78+
"vl %%v20,192(%%r1,%[x])\n\t"
79+
"vl %%v21,208(%%r1,%[x])\n\t"
80+
"vl %%v22,224(%%r1,%[x])\n\t"
81+
"vl %%v23,240(%%r1,%[x])\n\t"
8282
"vflpdb %%v16, %%v16\n\t"
8383
"vflpdb %%v17, %%v17\n\t"
8484
"vflpdb %%v18, %%v18\n\t"

kernel/zarch/dasum.c

Lines changed: 16 additions & 16 deletions
Original file line number | Diff line number | Diff line change
@@ -45,14 +45,14 @@ static FLOAT dasum_kernel_32(BLASLONG n, FLOAT *x) {
4545
"xgr %%r1,%%r1\n\t"
4646
"0:\n\t"
4747
"pfd 1, 1024(%%r1,%[x])\n\t"
48-
"vl %%v16, 0(%%r1,%[x]),3\n\t"
49-
"vl %%v17, 16(%%r1,%[x]),3\n\t"
50-
"vl %%v18, 32(%%r1,%[x]),3\n\t"
51-
"vl %%v19, 48(%%r1,%[x]),3\n\t"
52-
"vl %%v20, 64(%%r1,%[x]),3\n\t"
53-
"vl %%v21, 80(%%r1,%[x]),3\n\t"
54-
"vl %%v22, 96(%%r1,%[x]),3\n\t"
55-
"vl %%v23, 112(%%r1,%[x]),3\n\t"
48+
"vl %%v16, 0(%%r1,%[x])\n\t"
49+
"vl %%v17, 16(%%r1,%[x])\n\t"
50+
"vl %%v18, 32(%%r1,%[x])\n\t"
51+
"vl %%v19, 48(%%r1,%[x])\n\t"
52+
"vl %%v20, 64(%%r1,%[x])\n\t"
53+
"vl %%v21, 80(%%r1,%[x])\n\t"
54+
"vl %%v22, 96(%%r1,%[x])\n\t"
55+
"vl %%v23, 112(%%r1,%[x])\n\t"
5656
"vflpdb %%v16, %%v16\n\t"
5757
"vflpdb %%v17, %%v17\n\t"
5858
"vflpdb %%v18, %%v18\n\t"
@@ -69,14 +69,14 @@ static FLOAT dasum_kernel_32(BLASLONG n, FLOAT *x) {
6969
"vfadb %%v29,%%v29,%%v21\n\t"
7070
"vfadb %%v30,%%v30,%%v22\n\t"
7171
"vfadb %%v31,%%v31,%%v23\n\t"
72-
"vl %%v16, 128(%%r1,%[x]),3\n\t"
73-
"vl %%v17, 144(%%r1,%[x]),3\n\t"
74-
"vl %%v18, 160(%%r1,%[x]),3\n\t"
75-
"vl %%v19, 176(%%r1,%[x]),3\n\t"
76-
"vl %%v20, 192(%%r1,%[x]),3\n\t"
77-
"vl %%v21, 208(%%r1,%[x]),3\n\t"
78-
"vl %%v22, 224(%%r1,%[x]),3\n\t"
79-
"vl %%v23, 240(%%r1,%[x]),3\n\t"
72+
"vl %%v16, 128(%%r1,%[x])\n\t"
73+
"vl %%v17, 144(%%r1,%[x])\n\t"
74+
"vl %%v18, 160(%%r1,%[x])\n\t"
75+
"vl %%v19, 176(%%r1,%[x])\n\t"
76+
"vl %%v20, 192(%%r1,%[x])\n\t"
77+
"vl %%v21, 208(%%r1,%[x])\n\t"
78+
"vl %%v22, 224(%%r1,%[x])\n\t"
79+
"vl %%v23, 240(%%r1,%[x])\n\t"
8080
"vflpdb %%v16, %%v16\n\t"
8181
"vflpdb %%v17, %%v17\n\t"
8282
"vflpdb %%v18, %%v18\n\t"

kernel/zarch/daxpy.c

Lines changed: 48 additions & 48 deletions
Original file line number | Diff line number | Diff line change
@@ -34,22 +34,22 @@ static void daxpy_kernel_32(BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha) {
3434
"0:\n\t"
3535
"pfd 1, 1024(%%r1,%[x])\n\t"
3636
"pfd 2, 1024(%%r1,%[y])\n\t"
37-
"vl %%v16,0(%%r1,%[x]),3\n\t"
38-
"vl %%v17,16(%%r1,%[x]),3\n\t"
39-
"vl %%v18,32(%%r1,%[x]),3\n\t"
40-
"vl %%v19,48(%%r1,%[x]),3\n\t"
41-
"vl %%v20,0(%%r1,%[y]),3\n\t"
42-
"vl %%v21,16(%%r1,%[y]),3\n\t"
43-
"vl %%v22,32(%%r1,%[y]),3\n\t"
44-
"vl %%v23,48(%%r1,%[y]),3\n\t"
45-
"vl %%v24,64(%%r1,%[x]),3\n\t"
46-
"vl %%v25,80(%%r1,%[x]),3\n\t"
47-
"vl %%v26,96(%%r1,%[x]),3\n\t"
48-
"vl %%v27,112(%%r1,%[x]),3\n\t"
49-
"vl %%v28,64(%%r1,%[y]),3\n\t"
50-
"vl %%v29,80(%%r1,%[y]),3\n\t"
51-
"vl %%v30,96(%%r1,%[y]),3\n\t"
52-
"vl %%v31,112(%%r1,%[y]),3\n\t"
37+
"vl %%v16,0(%%r1,%[x])\n\t"
38+
"vl %%v17,16(%%r1,%[x])\n\t"
39+
"vl %%v18,32(%%r1,%[x])\n\t"
40+
"vl %%v19,48(%%r1,%[x])\n\t"
41+
"vl %%v20,0(%%r1,%[y])\n\t"
42+
"vl %%v21,16(%%r1,%[y])\n\t"
43+
"vl %%v22,32(%%r1,%[y])\n\t"
44+
"vl %%v23,48(%%r1,%[y])\n\t"
45+
"vl %%v24,64(%%r1,%[x])\n\t"
46+
"vl %%v25,80(%%r1,%[x])\n\t"
47+
"vl %%v26,96(%%r1,%[x])\n\t"
48+
"vl %%v27,112(%%r1,%[x])\n\t"
49+
"vl %%v28,64(%%r1,%[y])\n\t"
50+
"vl %%v29,80(%%r1,%[y])\n\t"
51+
"vl %%v30,96(%%r1,%[y])\n\t"
52+
"vl %%v31,112(%%r1,%[y])\n\t"
5353
"vfmadb %%v16,%%v0,%%v16,%%v20\n\t"
5454
"vfmadb %%v17,%%v0,%%v17,%%v21\n\t"
5555
"vfmadb %%v18,%%v0,%%v18,%%v22\n\t"
@@ -58,30 +58,30 @@ static void daxpy_kernel_32(BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha) {
5858
"vfmadb %%v25,%%v0,%%v25,%%v29\n\t"
5959
"vfmadb %%v26,%%v0,%%v26,%%v30\n\t"
6060
"vfmadb %%v27,%%v0,%%v27,%%v31\n\t"
61-
"vst %%v16,0(%%r1,%[y]),3\n\t"
62-
"vst %%v17,16(%%r1,%[y]),3\n\t"
63-
"vst %%v18,32(%%r1,%[y]),3\n\t"
64-
"vst %%v19,48(%%r1,%[y]),3\n\t"
65-
"vst %%v24,64(%%r1,%[y]),3\n\t"
66-
"vst %%v25,80(%%r1,%[y]),3\n\t"
67-
"vst %%v26,96(%%r1,%[y]),3\n\t"
68-
"vst %%v27,112(%%r1,%[y]),3\n\t"
69-
"vl %%v16,128(%%r1,%[x]),3\n\t"
70-
"vl %%v17,144(%%r1,%[x]),3\n\t"
71-
"vl %%v18,160(%%r1,%[x]),3\n\t"
72-
"vl %%v19,176(%%r1,%[x]),3\n\t"
73-
"vl %%v20,128(%%r1,%[y]),3\n\t"
74-
"vl %%v21,144(%%r1,%[y]),3\n\t"
75-
"vl %%v22,160(%%r1,%[y]),3\n\t"
76-
"vl %%v23,176(%%r1,%[y]),3\n\t"
77-
"vl %%v24,192(%%r1,%[x]),3\n\t"
78-
"vl %%v25,208(%%r1,%[x]),3\n\t"
79-
"vl %%v26,224(%%r1,%[x]),3\n\t"
80-
"vl %%v27,240(%%r1,%[x]),3\n\t"
81-
"vl %%v28,192(%%r1,%[y]),3\n\t"
82-
"vl %%v29,208(%%r1,%[y]),3\n\t"
83-
"vl %%v30,224(%%r1,%[y]),3\n\t"
84-
"vl %%v31,240(%%r1,%[y]),3\n\t"
61+
"vst %%v16,0(%%r1,%[y])\n\t"
62+
"vst %%v17,16(%%r1,%[y])\n\t"
63+
"vst %%v18,32(%%r1,%[y])\n\t"
64+
"vst %%v19,48(%%r1,%[y])\n\t"
65+
"vst %%v24,64(%%r1,%[y])\n\t"
66+
"vst %%v25,80(%%r1,%[y])\n\t"
67+
"vst %%v26,96(%%r1,%[y])\n\t"
68+
"vst %%v27,112(%%r1,%[y])\n\t"
69+
"vl %%v16,128(%%r1,%[x])\n\t"
70+
"vl %%v17,144(%%r1,%[x])\n\t"
71+
"vl %%v18,160(%%r1,%[x])\n\t"
72+
"vl %%v19,176(%%r1,%[x])\n\t"
73+
"vl %%v20,128(%%r1,%[y])\n\t"
74+
"vl %%v21,144(%%r1,%[y])\n\t"
75+
"vl %%v22,160(%%r1,%[y])\n\t"
76+
"vl %%v23,176(%%r1,%[y])\n\t"
77+
"vl %%v24,192(%%r1,%[x])\n\t"
78+
"vl %%v25,208(%%r1,%[x])\n\t"
79+
"vl %%v26,224(%%r1,%[x])\n\t"
80+
"vl %%v27,240(%%r1,%[x])\n\t"
81+
"vl %%v28,192(%%r1,%[y])\n\t"
82+
"vl %%v29,208(%%r1,%[y])\n\t"
83+
"vl %%v30,224(%%r1,%[y])\n\t"
84+
"vl %%v31,240(%%r1,%[y])\n\t"
8585
"vfmadb %%v16,%%v0,%%v16,%%v20\n\t"
8686
"vfmadb %%v17,%%v0,%%v17,%%v21\n\t"
8787
"vfmadb %%v18,%%v0,%%v18,%%v22\n\t"
@@ -90,14 +90,14 @@ static void daxpy_kernel_32(BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha) {
9090
"vfmadb %%v25,%%v0,%%v25,%%v29\n\t"
9191
"vfmadb %%v26,%%v0,%%v26,%%v30\n\t"
9292
"vfmadb %%v27,%%v0,%%v27,%%v31\n\t"
93-
"vst %%v16,128(%%r1,%[y]),3\n\t"
94-
"vst %%v17,144(%%r1,%[y]),3\n\t"
95-
"vst %%v18,160(%%r1,%[y]),3\n\t"
96-
"vst %%v19,176(%%r1,%[y]),3\n\t"
97-
"vst %%v24,192(%%r1,%[y]),3\n\t"
98-
"vst %%v25,208(%%r1,%[y]),3\n\t"
99-
"vst %%v26,224(%%r1,%[y]),3\n\t"
100-
"vst %%v27,240(%%r1,%[y]),3\n\t"
93+
"vst %%v16,128(%%r1,%[y])\n\t"
94+
"vst %%v17,144(%%r1,%[y])\n\t"
95+
"vst %%v18,160(%%r1,%[y])\n\t"
96+
"vst %%v19,176(%%r1,%[y])\n\t"
97+
"vst %%v24,192(%%r1,%[y])\n\t"
98+
"vst %%v25,208(%%r1,%[y])\n\t"
99+
"vst %%v26,224(%%r1,%[y])\n\t"
100+
"vst %%v27,240(%%r1,%[y])\n\t"
101101
"agfi %%r1,256\n\t"
102102
"brctg %[n],0b"
103103
: "+m"(*(FLOAT (*)[n]) y),[n] "+&r"(n)

kernel/zarch/ddot.c

Lines changed: 16 additions & 16 deletions
Original file line number | Diff line number | Diff line change
@@ -43,22 +43,22 @@ static FLOAT ddot_kernel_16(BLASLONG n, FLOAT *x, FLOAT *y) {
4343
"0:\n\t"
4444
"pfd 1,1024(%%r1,%[x])\n\t"
4545
"pfd 1,1024(%%r1,%[y])\n\t"
46-
"vl %%v16,0(%%r1,%[x]),3\n\t"
47-
"vl %%v17,16(%%r1,%[x]),3\n\t"
48-
"vl %%v18,32(%%r1,%[x]),3\n\t"
49-
"vl %%v19,48(%%r1,%[x]),3\n\t"
50-
"vl %%v20,64(%%r1,%[x]),3\n\t"
51-
"vl %%v21,80(%%r1,%[x]),3\n\t"
52-
"vl %%v22,96(%%r1,%[x]),3\n\t"
53-
"vl %%v23,112(%%r1,%[x]),3\n\t"
54-
"vl %%v24,0(%%r1,%[y]),3\n\t"
55-
"vl %%v25,16(%%r1,%[y]),3\n\t"
56-
"vl %%v26,32(%%r1,%[y]),3\n\t"
57-
"vl %%v27,48(%%r1,%[y]),3\n\t"
58-
"vl %%v28,64(%%r1,%[y]),3\n\t"
59-
"vl %%v29,80(%%r1,%[y]),3\n\t"
60-
"vl %%v30,96(%%r1,%[y]),3\n\t"
61-
"vl %%v31,112(%%r1,%[y]),3\n\t"
46+
"vl %%v16,0(%%r1,%[x])\n\t"
47+
"vl %%v17,16(%%r1,%[x])\n\t"
48+
"vl %%v18,32(%%r1,%[x])\n\t"
49+
"vl %%v19,48(%%r1,%[x])\n\t"
50+
"vl %%v20,64(%%r1,%[x])\n\t"
51+
"vl %%v21,80(%%r1,%[x])\n\t"
52+
"vl %%v22,96(%%r1,%[x])\n\t"
53+
"vl %%v23,112(%%r1,%[x])\n\t"
54+
"vl %%v24,0(%%r1,%[y])\n\t"
55+
"vl %%v25,16(%%r1,%[y])\n\t"
56+
"vl %%v26,32(%%r1,%[y])\n\t"
57+
"vl %%v27,48(%%r1,%[y])\n\t"
58+
"vl %%v28,64(%%r1,%[y])\n\t"
59+
"vl %%v29,80(%%r1,%[y])\n\t"
60+
"vl %%v30,96(%%r1,%[y])\n\t"
61+
"vl %%v31,112(%%r1,%[y])\n\t"
6262
"vfmadb %%v0,%%v16,%%v24,%%v0\n\t"
6363
"vfmadb %%v1,%%v17,%%v25,%%v1\n\t"
6464
"vfmadb %%v2,%%v18,%%v26,%%v2\n\t"

0 commit comments

Comments
 (0)