Skip to content

Commit 01834ae

Browse files
authored
Merge pull request #29 from xianyi/develop
rebase
2 parents d92bd5b + 5e94aa4 commit 01834ae

10 files changed

Lines changed: 66 additions & 20 deletions

File tree

.drone.yml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -92,7 +92,7 @@ steps:
9292
- mkdir build && cd build
9393
- cmake $CMAKE_FLAGS ..
9494
- make -j
95-
- ctest
95+
- ctest -V
9696

9797
---
9898
kind: pipeline
@@ -116,7 +116,7 @@ steps:
116116
- mkdir build && cd build
117117
- cmake $CMAKE_FLAGS ..
118118
- make -j
119-
- ctest
119+
- ctest -V
120120

121121
---
122122
kind: pipeline
@@ -140,4 +140,4 @@ steps:
140140
- mkdir build && cd build
141141
- cmake $CMAKE_FLAGS ..
142142
- make -j
143-
- ctest
143+
- ctest -V

.gitignore

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -87,4 +87,5 @@ build.*
8787
*.swp
8888
benchmark/*.goto
8989
benchmark/smallscaling
90-
90+
CMakeCache.txt
91+
CMakeFiles/*

kernel/power/KERNEL.POWER8

Lines changed: 32 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -89,30 +89,52 @@ ZTRSMKERNEL_RT = ../generic/trsm_kernel_RT.c
8989
#SMINKERNEL = ../arm/min.c
9090
#DMINKERNEL = ../arm/min.c
9191
#
92-
ifneq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
92+
ifneq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
93+
ifneq ($(GCCVERSIONGTEQ9),1)
9394
ISAMAXKERNEL = isamax_power8.S
9495
else
9596
ISAMAXKERNEL = isamax.c
9697
endif
98+
else
99+
ISAMAXKERNEL = isamax.c
100+
endif
101+
#
97102
IDAMAXKERNEL = idamax.c
98-
ifneq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
103+
#
104+
ifneq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
105+
ifneq ($(GCCVERSIONGTEQ9),1)
99106
ICAMAXKERNEL = icamax_power8.S
100107
else
101108
ICAMAXKERNEL = icamax.c
102109
endif
110+
else
111+
ICAMAXKERNEL = icamax.c
112+
endif
113+
#
103114
IZAMAXKERNEL = izamax.c
104115
#
105-
ifneq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
116+
ifneq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
117+
ifneq ($(GCCVERSIONGTEQ9),1)
106118
ISAMINKERNEL = isamin_power8.S
107119
else
108120
ISAMINKERNEL = isamin.c
109121
endif
122+
else
123+
ISAMINKERNEL = isamin.c
124+
endif
125+
#
110126
IDAMINKERNEL = idamin.c
111-
ifneq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
127+
#
128+
ifneq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
129+
ifneq ($(GCCVERSIONGTEQ9),1)
112130
ICAMINKERNEL = icamin_power8.S
113131
else
114132
ICAMINKERNEL = icamin.c
115133
endif
134+
else
135+
ICAMINKERNEL = icamin.c
136+
endif
137+
#
116138
IZAMINKERNEL = izamin.c
117139
#
118140
#ISMAXKERNEL = ../arm/imax.c
@@ -128,11 +150,16 @@ ZASUMKERNEL = zasum.c
128150
#
129151
SAXPYKERNEL = saxpy.c
130152
DAXPYKERNEL = daxpy.c
131-
ifneq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
153+
ifneq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
154+
ifneq ($(GCCVERSIONGTEQ9),1)
132155
CAXPYKERNEL = caxpy_power8.S
133156
else
134157
CAXPYKERNEL = caxpy.c
135158
endif
159+
else
160+
CAXPYKERNEL = caxpy.c
161+
endif
162+
#
136163
ZAXPYKERNEL = zaxpy.c
137164
#
138165
SCOPYKERNEL = scopy.c

kernel/power/KERNEL.PPC440

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@ ZASUMKERNEL = zasum_ppc440.S
1515

1616
SAXPYKERNEL = axpy_ppc440.S
1717
DAXPYKERNEL = axpy_ppc440.S
18-
ifneq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
18+
ifneq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
1919
CAXPYKERNEL = ../arm/zaxpy.c
2020
ZAXPYKERNEL = ../arm/zaxpy.c
2121
else
@@ -25,7 +25,7 @@ endif
2525

2626
SDOTKERNEL = dot_ppc440.S
2727
DDOTKERNEL = dot_ppc440.S
28-
ifneq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
28+
ifneq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
2929
CDOTKERNEL = zdot_ppc440.S
3030
ZDOTKERNEL = zdot_ppc440.S
3131
else
@@ -62,7 +62,7 @@ ZNRM2KERNEL = znrm2_ppc440.S
6262

6363
SROTKERNEL = rot_ppc440.S
6464
DROTKERNEL = rot_ppc440.S
65-
ifneq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
65+
ifneq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
6666
CROTKERNEL = zrot_ppc440.S
6767
ZROTKERNEL = zrot_ppc440.S
6868
else
@@ -132,7 +132,7 @@ ZTRSMKERNEL_LT = ztrsm_kernel_ppc440_LT.S
132132
ZTRSMKERNEL_RN = ztrsm_kernel_ppc440_LT.S
133133
ZTRSMKERNEL_RT = ztrsm_kernel_ppc440_RT.S
134134

135-
ifeq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
135+
ifeq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
136136
SGEMVNKERNEL = ../arm/gemv_n.c
137137
DGEMVNKERNEL = ../arm/gemv_n.c
138138
SGEMVTKERNEL = ../arm/gemv_t.c

kernel/power/KERNEL.PPC970

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
ifeq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
1+
ifeq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
22
SGEMMKERNEL = gemm_kernel.S
33
SGEMMINCOPY =
44
SGEMMITCOPY =
@@ -30,7 +30,7 @@ DGEMMITCOPYOBJ =
3030
DGEMMONCOPYOBJ = dgemm_oncopy$(TSUFFIX).$(SUFFIX)
3131
DGEMMOTCOPYOBJ = dgemm_otcopy$(TSUFFIX).$(SUFFIX)
3232

33-
ifeq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
33+
ifeq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
3434
CGEMMKERNEL = zgemm_kernel.S
3535
CGEMMINCOPY =
3636
CGEMMITCOPY =
@@ -72,7 +72,7 @@ ZTRSMKERNEL_LT = ztrsm_kernel_LT.S
7272
ZTRSMKERNEL_RN = ztrsm_kernel_LT.S
7373
ZTRSMKERNEL_RT = ztrsm_kernel_RT.S
7474

75-
ifeq ($(__BYTE_ORDER__),$(__ORDER_BIG_ENDIAN__))
75+
ifeq ($(__BYTE_ORDER__),"__ORDER_BIG_ENDIAN__")
7676
STRSMKERNEL_LN = trsm_kernel_LN.S
7777
STRSMKERNEL_LT = trsm_kernel_LT.S
7878
STRSMKERNEL_RN = trsm_kernel_LT.S

kernel/power/caxpy_power8.S

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -12,6 +12,13 @@
1212

1313
PROLOGUE
1414

15+
#if _CALL_ELF ==2
16+
#ifdef CONJ
17+
caxpyc_k:
18+
#else
19+
caxpy_k:
20+
#endif
21+
#endif
1522
.LCF0:
1623
0: addis 2,12,.TOC.-.LCF0@ha
1724
addi 2,2,.TOC.-.LCF0@l

kernel/power/icamin_power8.S

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,9 @@
1010
#include "common.h"
1111

1212
PROLOGUE
13-
13+
#if _CALL_ELF ==2
14+
icamin_k:
15+
#endif
1416
.LCF0:
1517
0: addis 2,12,.TOC.-.LCF0@ha
1618
addi 2,2,.TOC.-.LCF0@l

kernel/power/isamax_power8.S

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -11,7 +11,10 @@
1111
#include "common.h"
1212

1313
PROLOGUE
14-
14+
15+
#if _CALL_ELF == 2
16+
isamax_k:
17+
#endif
1518
.LCF0:
1619
0: addis 2,12,.TOC.-.LCF0@ha
1720
addi 2,2,.TOC.-.LCF0@l

kernel/power/isamin_power8.S

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -11,6 +11,9 @@
1111

1212
PROLOGUE
1313

14+
#if _CALL_ELF ==2
15+
isamin_k:
16+
#endif
1417
.LCF0:
1518
0: addis 2,12,.TOC.-.LCF0@ha
1619
addi 2,2,.TOC.-.LCF0@l

lapack/CMakeLists.txt

Lines changed: 5 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,6 @@ include_directories(${PROJECT_BINARY_DIR})
44

55

66
set(LAPACK_SOURCES
7-
getrf/getrf_single.c
87
potrf/potrf_U_single.c
98
potrf/potrf_L_single.c
109
lauum/lauum_U_single.c
@@ -45,6 +44,10 @@ GenerateNamedObjects("${LAPACK_MANGLED_SOURCES}" "" "" false "" "" false 3)
4544
GenerateNamedObjects("laswp/generic/laswp_k_4.c" "" "laswp_plus" false "" "" false 3)
4645
GenerateNamedObjects("laswp/generic/laswp_k_4.c" "MINUS" "laswp_minus" false "" "" false 3)
4746

47+
foreach (float_type ${FLOAT_TYPES})
48+
GenerateNamedObjects("getrf/getrf_single.c" "UNIT" "getrf_single" false "" "" false ${float_type})
49+
endforeach ()
50+
4851
# dynamic_arch laswp needs arch specific code ?
4952
#foreach(TARGET_CORE ${DYNAMIC_CORE})
5053
# set(TSUFFIX "_${TARGET_CORE}")
@@ -81,7 +84,7 @@ if (USE_THREAD)
8184
)
8285

8386
foreach (float_type ${FLOAT_TYPES})
84-
GenerateNamedObjects("${GETRF_SRC}" "" "getrf_parallel" false "" "" false ${float_type})
87+
GenerateNamedObjects("${GETRF_SRC}" "UNIT" "getrf_parallel" false "" "" false ${float_type})
8588
endforeach()
8689

8790
GenerateNamedObjects("${PARALLEL_SOURCES}")

0 commit comments

Comments
 (0)