Skip to content

Commit 60e6c68

Browse files
committed
Adapt ARM architecture
1 parent 1b1a757 commit 60e6c68

File tree

4 files changed

+6
-6
lines changed

4 files changed

+6
-6
lines changed

kernel/arm64/KERNEL.ARMV8

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -97,7 +97,7 @@ CNRM2KERNEL = znrm2.S
 97  97   ZNRM2KERNEL = znrm2.S
 98  98
 99  99   DDOTKERNEL = dot.S
100     - SDOTKERNEL = dot.S
    100 + SDOTKERNEL = ../generic/dot.c
101 101   CDOTKERNEL = zdot.S
102 102   ZDOTKERNEL = zdot.S
103 103   DSDOTKERNEL = dot.S

kernel/arm64/KERNEL.CORTEXA53

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -97,7 +97,7 @@ CNRM2KERNEL = znrm2.S
 97  97   ZNRM2KERNEL = znrm2.S
 98  98
 99  99   DDOTKERNEL = dot.S
100     - SDOTKERNEL = dot.S
    100 + SDOTKERNEL = ../generic/dot.c
101 101   CDOTKERNEL = zdot.S
102 102   ZDOTKERNEL = zdot.S
103 103   DSDOTKERNEL = dot.S

kernel/arm64/KERNEL.CORTEXA57

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -70,7 +70,7 @@ DCOPYKERNEL = copy.S
70 70   CCOPYKERNEL = copy.S
71 71   ZCOPYKERNEL = copy.S
72 72
73    - SDOTKERNEL = dot.S
   73 + SDOTKERNEL = ../generic/dot.c
74 74   DDOTKERNEL = dot.S
75 75   CDOTKERNEL = zdot.S
76 76   ZDOTKERNEL = zdot.S

kernel/generic/dot.c

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27 27
28 28
29 29   #include "common.h"
30    -
   30 + #include "../simd/intrin.h"
31 31   #if defined(DSDOT)
32 32   double CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x, FLOAT *y, BLASLONG inc_y)
33 33   #else
@@ -47,9 +47,9 @@ FLOAT CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x, FLOAT *y, BLASLONG inc_y)
47 47
48 48   if ( (inc_x == 1) && (inc_y == 1) )
49 49   {
50    - int n1 = n & -4;
   50 + int n1 = n & -4;
51 51   #if V_SIMD && !defined(DSDOT)
52    - const int vstep = v_nlanes_f32;
   52 + const int vstep = v_nlanes_f32;
53 53   const int unrollx4 = n & (-vstep * 4);
54 54   const int unrollx = n & -vstep;
55 55   v_f32 vsum0 = v_zero_f32();

0 commit comments

Comments
 (0)