Skip to content

Commit b3a5144

Browse files
authored
Merge pull request #4167 from Mousius/sve-zhemm-fix
Fix ZHEMM copy for SVE
2 parents 9ba9c8b + 730ca04 commit b3a5144

File tree

2 files changed

+4
-4
lines changed

2 files changed

+4
-4
lines changed

kernel/arm64/zhemm_ltcopy_sve.c

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -80,7 +80,7 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON
80 80
gat_ind = svadd_m(cmp, gat_ind, lda_vec);
81 81
gat_ind = svadd_m(svnot_z(pg, cmp) , gat_ind, 2);
82 82
if (offset <= 0) {
83-
svbool_t off_g = svwhilelt_b64((uint64_t)offset, (uint64_t)0LL);
83+
svbool_t off_g = svwhilelt_b64((int64_t)offset, (int64_t)0LL);
84 84
data_vec_imag = svneg_m(data_vec_imag, off_g, data_vec_imag);
85 85
}
86 86

@@ -143,7 +143,7 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON
143 143
gat_ind = svadd_m(cmp, gat_ind, lda_vec);
144 144
gat_ind = svadd_m(svnot_z(pg, cmp) , gat_ind, 2);
145 145
if (offset <= 0) {
146-
svbool_t off_g = svwhilelt_b32((uint32_t)offset, (uint32_t)0);
146+
svbool_t off_g = svwhilelt_b32((int32_t)offset, (int32_t)0);
147 147
data_vec_imag = svneg_m(data_vec_imag, off_g, data_vec_imag);
148 148
}
149 149

kernel/arm64/zhemm_utcopy_sve.c

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -81,7 +81,7 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON
81 81
gat_ind = svadd_m(svnot_z(pg, cmp) , gat_ind, lda_vec);
82 82
data_vec_imag = svneg_z(pg, data_vec_imag);
83 83
if (offset <= 0) {
84-
svbool_t off_g = svwhilelt_b64((uint64_t)offset, (uint64_t)0LL);
84+
svbool_t off_g = svwhilelt_b64((int64_t)offset, (int64_t)0LL);
85 85
data_vec_imag = svneg_m(data_vec_imag, off_g, data_vec_imag);
86 86
}
87 87

@@ -143,7 +143,7 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON
143 143
gat_ind = svadd_m(svnot_z(pg, cmp) , gat_ind, lda_vec);
144 144
data_vec_imag = svneg_z(pg, data_vec_imag);
145 145
if (offset <= 0) {
146-
svbool_t off_g = svwhilelt_b32((uint32_t)offset, (uint32_t)0);
146+
svbool_t off_g = svwhilelt_b32((int32_t)offset, (int32_t)0);
147 147
data_vec_imag = svneg_m(data_vec_imag, off_g, data_vec_imag);
148 148
}
149 149

0 commit comments

Comments
 (0)