@@ -57,7 +57,7 @@ CAMAXKERNEL = zamax.S
5757ZAMAXKERNEL = zamax.S
5858
5959SAXPYKERNEL = axpy.S
60- DAXPYKERNEL = axpy.S
60+ DAXPYKERNEL = daxpy_thunderx2t99.S
6161CAXPYKERNEL = zaxpy.S
6262ZAXPYKERNEL = zaxpy.S
6363
@@ -81,45 +81,35 @@ DGEMVTKERNEL = gemv_t.S
8181CGEMVTKERNEL = zgemv_t.S
8282ZGEMVTKERNEL = zgemv_t.S
8383
84-
85- SASUMKERNEL = asum.S
86- DASUMKERNEL = asum.S
87- CASUMKERNEL = casum.S
88- ZASUMKERNEL = zasum.S
89-
90- SCOPYKERNEL = copy.S
91- DCOPYKERNEL = copy.S
92- CCOPYKERNEL = copy.S
93- ZCOPYKERNEL = copy.S
94-
95- SSWAPKERNEL = swap.S
96- DSWAPKERNEL = swap.S
97- CSWAPKERNEL = swap.S
98- ZSWAPKERNEL = swap.S
99-
100- ISAMAXKERNEL = iamax.S
101- IDAMAXKERNEL = iamax.S
102- ICAMAXKERNEL = izamax.S
103- IZAMAXKERNEL = izamax.S
104-
105- SNRM2KERNEL = nrm2.S
106- DNRM2KERNEL = nrm2.S
107- CNRM2KERNEL = znrm2.S
108- ZNRM2KERNEL = znrm2.S
109-
110- DDOTKERNEL = dot.S
111- ifneq ($(C_COMPILER), PGI)
112- SDOTKERNEL = ../generic/dot.c
113- else
114- SDOTKERNEL = dot.S
115- endif
116- ifneq ($(C_COMPILER), PGI)
117- CDOTKERNEL = zdot.S
118- ZDOTKERNEL = zdot.S
119- else
120- CDOTKERNEL = ../arm/zdot.c
121- ZDOTKERNEL = ../arm/zdot.c
122- endif
84+ SASUMKERNEL = sasum_thunderx2t99.c
85+ DASUMKERNEL = dasum_thunderx2t99.c
86+ CASUMKERNEL = casum_thunderx2t99.c
87+ ZASUMKERNEL = zasum_thunderx2t99.c
88+
89+ SCOPYKERNEL = copy_thunderx2t99.c
90+ DCOPYKERNEL = copy_thunderx2t99.c
91+ CCOPYKERNEL = copy_thunderx2t99.c
92+ ZCOPYKERNEL = copy_thunderx2t99.c
93+
94+ SSWAPKERNEL = swap_thunderx2t99.S
95+ DSWAPKERNEL = swap_thunderx2t99.S
96+ CSWAPKERNEL = swap_thunderx2t99.S
97+ ZSWAPKERNEL = swap_thunderx2t99.S
98+
99+ ISAMAXKERNEL = iamax_thunderx2t99.c
100+ IDAMAXKERNEL = iamax_thunderx2t99.c
101+ ICAMAXKERNEL = izamax_thunderx2t99.c
102+ IZAMAXKERNEL = izamax_thunderx2t99.c
103+
104+ SNRM2KERNEL = scnrm2_thunderx2t99.c
105+ DNRM2KERNEL = dznrm2_thunderx2t99.c
106+ CNRM2KERNEL = scnrm2_thunderx2t99.c
107+ ZNRM2KERNEL = dznrm2_thunderx2t99.c
108+
109+ DDOTKERNEL = dot.c
110+ SDOTKERNEL = dot.c
111+ CDOTKERNEL = zdot_thunderx2t99.c
112+ ZDOTKERNEL = zdot_thunderx2t99.c
123113DSDOTKERNEL = dot.S
124114
125115DGEMM_BETA = dgemm_beta.S
@@ -128,10 +118,10 @@ SGEMM_BETA = sgemm_beta.S
128118SGEMMKERNEL = sgemm_kernel_sve_v2x$(SGEMM_UNROLL_N).S
129119STRMMKERNEL = strmm_kernel_sve_v1x$(SGEMM_UNROLL_N).S
130120
131- SGEMMINCOPY = sgemm_ncopy_sve_v1.c
132- SGEMMITCOPY = sgemm_tcopy_sve_v1.c
133- SGEMMONCOPY = sgemm_ncopy_$(DGEMM_UNROLL_N).S
134- SGEMMOTCOPY = sgemm_tcopy_$(DGEMM_UNROLL_N).S
121+ SGEMMINCOPY = gemm_ncopy_sve_v1x$(SGEMM_UNROLL_N).c
122+ SGEMMITCOPY = gemm_tcopy_sve_v1x$(SGEMM_UNROLL_N).c
123+ SGEMMONCOPY = sgemm_ncopy_$(SGEMM_UNROLL_N).S
124+ SGEMMOTCOPY = sgemm_tcopy_$(SGEMM_UNROLL_N).S
135125
136126SGEMMINCOPYOBJ = sgemm_incopy$(TSUFFIX).$(SUFFIX)
137127SGEMMITCOPYOBJ = sgemm_itcopy$(TSUFFIX).$(SUFFIX)
@@ -149,8 +139,8 @@ SSYMMLCOPY_M = symm_lcopy_sve.c
149139DGEMMKERNEL = dgemm_kernel_sve_v2x$(DGEMM_UNROLL_N).S
150140DTRMMKERNEL = dtrmm_kernel_sve_v1x$(DGEMM_UNROLL_N).S
151141
152- DGEMMINCOPY = dgemm_ncopy_sve_v1.c
153- DGEMMITCOPY = dgemm_tcopy_sve_v1.c
142+ DGEMMINCOPY = gemm_ncopy_sve_v1x$(DGEMM_UNROLL_N).c
143+ DGEMMITCOPY = gemm_tcopy_sve_v1x$(DGEMM_UNROLL_N).c
154144DGEMMONCOPY = dgemm_ncopy_$(DGEMM_UNROLL_N).S
155145DGEMMOTCOPY = dgemm_tcopy_$(DGEMM_UNROLL_N).S
156146
@@ -170,8 +160,8 @@ DSYMMLCOPY_M = symm_lcopy_sve.c
170160CGEMMKERNEL = cgemm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
171161CTRMMKERNEL = ctrmm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
172162
173- CGEMMINCOPY = cgemm_ncopy_sve_v1.c
174- CGEMMITCOPY = cgemm_tcopy_sve_v1.c
163+ CGEMMINCOPY = gemm_ncopy_complex_sve_v1x$(ZGEMM_UNROLL_N).c
164+ CGEMMITCOPY = gemm_tcopy_complex_sve_v1x$(ZGEMM_UNROLL_N).c
175165CGEMMONCOPY = ../generic/zgemm_ncopy_$(ZGEMM_UNROLL_N).c
176166CGEMMOTCOPY = ../generic/zgemm_tcopy_$(ZGEMM_UNROLL_N).c
177167
@@ -194,8 +184,8 @@ CSYMMLCOPY_M = zsymm_lcopy_sve.c
194184ZGEMMKERNEL = zgemm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
195185ZTRMMKERNEL = ztrmm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
196186
197- ZGEMMINCOPY = zgemm_ncopy_sve_v1.c
198- ZGEMMITCOPY = zgemm_tcopy_sve_v1.c
187+ ZGEMMINCOPY = gemm_ncopy_complex_sve_v1x$(ZGEMM_UNROLL_N).c
188+ ZGEMMITCOPY = gemm_tcopy_complex_sve_v1x$(ZGEMM_UNROLL_N).c
199189ZGEMMONCOPY = ../generic/zgemm_ncopy_$(ZGEMM_UNROLL_N).c
200190ZGEMMOTCOPY = ../generic/zgemm_tcopy_$(ZGEMM_UNROLL_N).c
201191
0 commit comments