Skip to content

Commit 680f744

Browse files
authored
Merge pull request #108 from xianyi/develop
rebase
2 parents ab7f466 + 6f9460f commit 680f744

File tree

5 files changed: 14 additions (+14) and 9 deletions (-9).

Diff for: Makefile.x86_64

+1-1
Original file line numberDiff line numberDiff line change
@@ -90,7 +90,7 @@ ifeq ($(F_COMPILER), GFORTRAN)
9090
GCCVERSIONGTEQ4 := $(shell expr `$(FC) -dumpversion | cut -f1 -d.` \>= 4)
9191
GCCVERSIONGTEQ5 := $(shell expr `$(FC) -dumpversion | cut -f1 -d.` \>= 5)
9292
GCCMINORVERSIONGTEQ7 := $(shell expr `$(FC) -dumpversion | cut -f2 -d.` \>= 7)
93-
GCCVERSIONCHECK := $(GCCVERSIONGTEQ5)$(GCCVERSIONGTEQ4)$(GCCVERSIONMINORGTEQ7)
93+
GCCVERSIONCHECK := $(GCCVERSIONGTEQ5)$(GCCVERSIONGTEQ4)$(GCCMINORVERSIONGTEQ7)
9494
ifeq ($(GCCVERSIONCHECK), $(filter $(GCCVERSIONCHECK), 011 110 111))
9595
FCOMMON_OPT += -mavx2
9696
endif

Diff for: common_power.h

+2-2
Original file line numberDiff line numberDiff line change
@@ -844,8 +844,8 @@ Lmcount$lazy_ptr:
844844
#define BUFFER_SIZE ( 2 << 20)
845845
#elif defined(PPC440FP2)
846846
#define BUFFER_SIZE ( 16 << 20)
847-
#elif defined(POWER8) || defined(POWER9) || defined(POWER10)
848-
#define BUFFER_SIZE ( 64 << 20)
847+
#elif defined(POWER6) || defined(POWER8) || defined(POWER9) || defined(POWER10)
848+
#define BUFFER_SIZE ( 64 << 22)
849849
#else
850850
#define BUFFER_SIZE ( 16 << 20)
851851
#endif

Diff for: kernel/Makefile

+9-4
Original file line numberDiff line numberDiff line change
@@ -22,20 +22,25 @@ ifeq ($(C_COMPILER), CLANG)
2222
override CFLAGS += -fno-integrated-as
2323
endif
2424
endif
25+
2526
AVX2OPT =
2627
ifeq ($(C_COMPILER), GCC)
2728
# AVX2 support was added in 4.7.0
28-
GCCVERSIONGTEQ4 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 4)
29-
GCCMINORVERSIONGTEQ7 := $(shell expr `$(CC) -dumpversion | cut -f2 -d.` \>= 7)
30-
ifeq ($(GCCVERSIONGTEQ4)$(GCCMINORVERSIONGTEQ7), 11)
29+
GCCVERSIONGTEQ4 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 4)
30+
GCCVERSIONGTEQ5 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 5)
31+
GCCMINORVERSIONGTEQ7 := $(shell expr `$(CC) -dumpversion | cut -f2 -d.` \>= 7)
32+
GCCVERSIONCHECK := $(GCCVERSIONGTEQ5)$(GCCVERSIONGTEQ4)$(GCCMINORVERSIONGTEQ7)
33+
ifeq ($(GCCVERSIONCHECK), $(filter $(GCCVERSIONCHECK), 011 110 111))
3134
AVX2OPT = -mavx2
3235
endif
3336
endif
3437
ifeq ($(C_COMPILER), CLANG)
3538
# Any clang posing as gcc 4.2 should be new enough (3.4 or later)
3639
GCCVERSIONGTEQ4 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 4)
40+
GCCVERSIONGTEQ5 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 5)
3741
GCCMINORVERSIONGTEQ2 := $(shell expr `$(CC) -dumpversion | cut -f2 -d.` \>= 2)
38-
ifeq ($(GCCVERSIONGTEQ4)$(GCCMINORVERSIONGTEQ2), 11)
42+
GCCVERSIONCHECK := $(GCCVERSIONGTEQ5)$(GCCVERSIONGTEQ4)$(GCCMINORVERSIONGTEQ7)
43+
ifeq ($(GCCVERSIONCHECK), $(filter $(GCCVERSIONCHECK), 011 110 111))
3944
AVX2OPT = -mavx2
4045
endif
4146
endif

Diff for: kernel/power/zgemv_t_4.c

+1-1
Original file line numberDiff line numberDiff line change
@@ -513,7 +513,7 @@ static void zgemv_kernel_4x1(BLASLONG n, FLOAT *ap, FLOAT *x, FLOAT *y, FLOAT al
513513

514514
#endif
515515

516-
static __attribute__((always_inline)) void copy_x(BLASLONG n, FLOAT *src, FLOAT *dest, BLASLONG inc_src) {
516+
static __attribute__((always_inline)) inline void copy_x(BLASLONG n, FLOAT *src, FLOAT *dest, BLASLONG inc_src) {
517517
BLASLONG i;
518518
for (i = 0; i < n; i++) {
519519
*dest = *src;

Diff for: lapack-netlib/LAPACKE/src/lapacke_zgesvdq.c

+1-1
Original file line numberDiff line numberDiff line change
@@ -71,7 +71,7 @@ lapack_int LAPACKE_zgesvdq( int matrix_layout, char joba, char jobp,
7171
goto exit_level_0;
7272
}
7373
liwork = iwork_query;
74-
lcwork = LAPACK_C2INT(cwork_query);
74+
lcwork = LAPACK_Z2INT(cwork_query);
7575
lrwork = (lapack_int)rwork_query;
7676
/* Allocate memory for work arrays */
7777
iwork = (lapack_int*)LAPACKE_malloc( sizeof(lapack_int) * liwork );

Comments: 0 commit comments