@@ -102,7 +102,7 @@ gf_6vect_dot_prod_rvv:
102
102
sd s7, 56 (sp)
103
103
104
104
li t0, 0x0F
105
- vsetvli a5, x0, e8, m1
105
+ vsetvli a5, x0, e8, m1, ta, ma
106
106
107
107
/* initialize position */
108
108
li x_pos, 0
@@ -147,10 +147,9 @@ gf_6vect_dot_prod_rvv:
147
147
148
148
.Llooprvv_vl_vects:
149
149
/* load source data */
150
- add x_ptr,x_ptr,x_pos
150
+ add x_ptr, x_ptr, x_pos
151
151
vle8.v v_src, (x_ptr)
152
152
153
-
154
153
/* split 4-bit lo; 4-bit hi */
155
154
vand.vi v_src_lo, v_src, 0x0F
156
155
vsrl.vi v_src_hi, v_src, 4
@@ -167,7 +166,7 @@ gf_6vect_dot_prod_rvv:
167
166
addi x_tbl2, x_tbl2, 16
168
167
169
168
/* load next source pointer */
170
- addi x_vec_i, x_vec_i,8
169
+ addi x_vec_i, x_vec_i, 8
171
170
add a6, x_src, x_vec_i
172
171
ld x_ptr, 0 (a6)
173
172
@@ -238,12 +237,12 @@ gf_6vect_dot_prod_rvv:
238
237
vse8.v v_dest5, (x_dest5) # x_dest5
239
238
vse8.v v_dest6, (x_dest6) # x_dest6
240
239
241
- add x_dest1,x_dest1, a5
242
- add x_dest2,x_dest2, a5
243
- add x_dest3,x_dest3, a5
244
- add x_dest4,x_dest4, a5
245
- add x_dest5,x_dest5, a5
246
- add x_dest6,x_dest6, a5
240
+ add x_dest1, x_dest1, a5
241
+ add x_dest2, x_dest2, a5
242
+ add x_dest3, x_dest3, a5
243
+ add x_dest4, x_dest4, a5
244
+ add x_dest5, x_dest5, a5
245
+ add x_dest6, x_dest6, a5
247
246
248
247
/* increment position */
249
248
add x_pos, x_pos, a5
0 commit comments