@@ -43,7 +43,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
43
43
/* Scalar lane used as the multiplier by every fmul in the loop shown further down. */
#define betaV0 v11.d [ 0 ]
44
44
/* Loop counter: decremented by `subs I, I, #1`, and the loop repeats while it is non-zero (bne). */
#define I x16
45
45
46
/* Old single constant (removed by this change); it was the per-iteration advance of A01..A04. */
- #define size 128
46
/* Byte offset ahead of A01 / A03 that the prfm PLDL1KEEP instructions in the loop touch. */
+ #define prfm_size 640
47
/* Bytes added to each of A01..A04 after its st1, i.e. the per-iteration pointer stride. */
+ #define calc_size 128
47
48
48
49
/**************************************************************************************
49
50
* Macro definitions
@@ -119,27 +120,31 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
119
120
ldp q2 , q3 , [ A02 ]
120
121
ldp q4 , q5 , [ A03 ]
121
122
ldp q6 , q7 , [ A04 ]
122
-
123
+
123
124
fmul v0.2d , v0.2d , betaV0
124
125
fmul v1.2d , v1.2d , betaV0
125
-
126
+
126
127
fmul v2.2d , v2.2d , betaV0
127
128
fmul v3.2d , v3.2d , betaV0
128
-
129
+
130
+ prfm PLDL1KEEP , [ A01 , prfm_size ]
131
+
129
132
fmul v4.2d , v4.2d , betaV0
130
133
fmul v5.2d , v5.2d , betaV0
131
-
134
+
135
+ prfm PLDL1KEEP , [ A03 , prfm_size ]
136
+
132
137
fmul v6.2d , v6.2d , betaV0
133
138
fmul v7.2d , v7.2d , betaV0
134
139
135
140
st1 {v0.2d , v1.2d} , [ A01 ]
136
- add A01 , A01 , size
141
+ add A01 , A01 , calc_size
137
142
st1 {v2.2d , v3.2d} , [ A02 ]
138
- add A02 , A02 , size
143
+ add A02 , A02 , calc_size
139
144
st1 {v4.2d , v5.2d} , [ A03 ]
140
- add A03 , A03 , size
145
+ add A03 , A03 , calc_size
141
146
st1 {v6.2d , v7.2d} , [ A04 ]
142
- add A04 , A04 , size
147
+ add A04 , A04 , calc_size
143
148
144
149
subs I , I , # 1
145
150
bne .Lgemm_beta_03
0 commit comments