@@ -48,9 +48,9 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
48
48
#define VFADDVV_FLOAT __riscv_vfadd_vv_f64m4
49
49
#define VFIRSTM __riscv_vfirst_m_b16
50
50
#define UINT_V_T vuint64m4_t
51
- #define VIDV_MASK_UINT __riscv_vid_v_u64m4_m
51
+ #define VIDV_MASK_UINT __riscv_vid_v_u64m4_mu
52
52
#define VIDV_UINT __riscv_vid_v_u64m4
53
- #define VADDVX_MASK_UINT __riscv_vadd_vx_u64m4_m
53
+ #define VADDVX_MASK_UINT __riscv_vadd_vx_u64m4_mu
54
54
#define VADDVX_UINT __riscv_vadd_vx_u64m4
55
55
#define VMVVX_UINT __riscv_vmv_v_x_u64m4
56
56
#define VFMVFS_FLOAT_M1 __riscv_vfmv_f_s_f64m1_f64
@@ -77,9 +77,9 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
77
77
#define VFADDVV_FLOAT __riscv_vfadd_vv_f32m4
78
78
#define VFIRSTM __riscv_vfirst_m_b8
79
79
#define UINT_V_T vuint32m4_t
80
- #define VIDV_MASK_UINT __riscv_vid_v_u32m4_m
80
+ #define VIDV_MASK_UINT __riscv_vid_v_u32m4_mu
81
81
#define VIDV_UINT __riscv_vid_v_u32m4
82
- #define VADDVX_MASK_UINT __riscv_vadd_vx_u32m4_m
82
+ #define VADDVX_MASK_UINT __riscv_vadd_vx_u32m4_mu
83
83
#define VADDVX_UINT __riscv_vadd_vx_u32m4
84
84
#define VMVVX_UINT __riscv_vmv_v_x_u32m4
85
85
#define VFMVFS_FLOAT_M1 __riscv_vfmv_f_s_f32m1_f32
@@ -116,8 +116,8 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x)
116
116
117
117
//index where element greater than v_max
118
118
mask = VMFLTVV_FLOAT (v_max , vx0 , vl );
119
- v_max_index = VIDV_MASK_UINT (mask , vl );
120
- v_max_index = VADDVX_MASK_UINT (mask , v_max_index , j , vl );
119
+ v_max_index = VIDV_MASK_UINT (mask , v_max_index , vl );
120
+ v_max_index = VADDVX_MASK_UINT (mask , v_max_index , v_max_index , j , vl );
121
121
122
122
//update v_max and start_index j
123
123
v_max = VFMAXVV_FLOAT (v_max , vx0 , vl );
@@ -138,9 +138,9 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x)
138
138
139
139
//index where element greater than v_max
140
140
mask = VMFLTVV_FLOAT (v_max , vx0 , vl );
141
- v_max_index = VIDV_MASK_UINT (mask , vl );
142
- v_max_index = VADDVX_MASK_UINT (mask , v_max_index , j , vl );
143
-
141
+ v_max_index = VIDV_MASK_UINT (mask , v_max_index , vl );
142
+ v_max_index = VADDVX_MASK_UINT (mask , v_max_index , v_max_index , j , vl );
143
+
144
144
//update v_max and start_index j
145
145
v_max = VFMAXVV_FLOAT (v_max , vx0 , vl );
146
146
}
0 commit comments