Compare commits
No commits in common. "c9s" and "c8" have entirely different histories.
@ -1 +0,0 @@
|
|||||||
1
|
|
29
.gitignore
vendored
29
.gitignore
vendored
@ -1,28 +1 @@
|
|||||||
/v0.2.5.tar.gz
|
SOURCES/v0.3.15.tar.gz
|
||||||
/v0.2.7.tar.gz
|
|
||||||
/v0.2.8.tar.gz
|
|
||||||
/v0.2.9.tar.gz
|
|
||||||
/v0.2.10.tar.gz
|
|
||||||
/v0.2.11.tar.gz
|
|
||||||
/v0.2.12.tar.gz
|
|
||||||
/v0.2.13.tar.gz
|
|
||||||
/v0.2.14.tar.gz
|
|
||||||
/v0.2.15.tar.gz
|
|
||||||
/v0.2.16.tar.gz
|
|
||||||
/openblas-0.2.17.tar.gz
|
|
||||||
/v0.2.18.tar.gz
|
|
||||||
/v0.2.19.tar.gz
|
|
||||||
/v0.3.0.tar.gz
|
|
||||||
/v0.3.1.tar.gz
|
|
||||||
/openblas-0.3.2.tar.gz
|
|
||||||
/openblas-0.3.6.tar.gz
|
|
||||||
/openblas-0.3.7.tar.gz
|
|
||||||
/openblas-0.3.8.tar.gz
|
|
||||||
/openblas-0.3.9.tar.gz
|
|
||||||
/openblas-0.3.10.tar.gz
|
|
||||||
/openblas-0.3.11.tar.gz
|
|
||||||
/openblas-0.3.12.tar.gz
|
|
||||||
/openblas-0.3.13.tar.gz
|
|
||||||
/openblas-0.3.15.tar.gz
|
|
||||||
/openblas-0.3.21.tar.gz
|
|
||||||
/OpenBLAS-0.3.26.tar.gz
|
|
||||||
|
1
.openblas.metadata
Normal file
1
.openblas.metadata
Normal file
@ -0,0 +1 @@
|
|||||||
|
d7d1f67c1ef0c14c93761bdf44f0da8d0dd4bc0f SOURCES/v0.3.15.tar.gz
|
6964
SOURCES/openblas-0.3.15-asmflags.patch
Normal file
6964
SOURCES/openblas-0.3.15-asmflags.patch
Normal file
File diff suppressed because it is too large
Load Diff
@ -1,7 +1,8 @@
|
|||||||
diff -up OpenBLAS-0.2.5/Makefile.system.orig OpenBLAS-0.2.5/Makefile.system
|
diff --git a/Makefile.system b/Makefile.system
|
||||||
--- OpenBLAS-0.2.5/Makefile.system.orig 2012-11-27 01:24:53.000000000 +0200
|
index ae703e4d..80739dc4 100644
|
||||||
+++ OpenBLAS-0.2.5/Makefile.system 2012-12-24 16:13:57.316689688 +0200
|
--- a/Makefile.system
|
||||||
@@ -758,16 +758,16 @@ ifndef SMP
|
+++ b/Makefile.system
|
||||||
|
@@ -1515,16 +1515,16 @@ ifndef SMP
|
||||||
LIBNAME = $(LIBPREFIX)_$(LIBCORE)$(REVISION).$(LIBSUFFIX)
|
LIBNAME = $(LIBPREFIX)_$(LIBCORE)$(REVISION).$(LIBSUFFIX)
|
||||||
LIBNAME_P = $(LIBPREFIX)_$(LIBCORE)$(REVISION)_p.$(LIBSUFFIX)
|
LIBNAME_P = $(LIBPREFIX)_$(LIBCORE)$(REVISION)_p.$(LIBSUFFIX)
|
||||||
else
|
else
|
47
SOURCES/openblas-0.3.15-noopt.patch
Normal file
47
SOURCES/openblas-0.3.15-noopt.patch
Normal file
@ -0,0 +1,47 @@
|
|||||||
|
diff --git a/lapack-netlib/INSTALL/Makefile b/lapack-netlib/INSTALL/Makefile
|
||||||
|
index 1007c1bc..348b8d60 100644
|
||||||
|
--- a/lapack-netlib/INSTALL/Makefile
|
||||||
|
+++ b/lapack-netlib/INSTALL/Makefile
|
||||||
|
@@ -46,5 +46,5 @@ cleanexe:
|
||||||
|
cleantest:
|
||||||
|
rm -f core
|
||||||
|
|
||||||
|
-slamch.o: slamch.f ; $(FC) $(FFLAGS_NOOPT) -c -o $@ $<
|
||||||
|
-dlamch.o: dlamch.f ; $(FC) $(FFLAGS_NOOPT) -c -o $@ $<
|
||||||
|
+slamch.o: slamch.f ; $(FC) $(FFLAGS) -c -o $@ $<
|
||||||
|
+dlamch.o: dlamch.f ; $(FC) $(FFLAGS) -c -o $@ $<
|
||||||
|
diff --git a/lapack-netlib/SRC/Makefile b/lapack-netlib/SRC/Makefile
|
||||||
|
index 83baac87..bc42e82d 100644
|
||||||
|
--- a/lapack-netlib/SRC/Makefile
|
||||||
|
+++ b/lapack-netlib/SRC/Makefile
|
||||||
|
@@ -643,9 +643,9 @@ cleanobj:
|
||||||
|
cleanlib:
|
||||||
|
rm -f $(LAPACKLIB)
|
||||||
|
|
||||||
|
-slaruv.o: slaruv.f ; $(FC) $(FFLAGS_NOOPT) -c -o $@ $<
|
||||||
|
-dlaruv.o: dlaruv.f ; $(FC) $(FFLAGS_NOOPT) -c -o $@ $<
|
||||||
|
-sla_wwaddw.o: sla_wwaddw.f ; $(FC) $(FFLAGS_NOOPT) -c -o $@ $<
|
||||||
|
-dla_wwaddw.o: dla_wwaddw.f ; $(FC) $(FFLAGS_NOOPT) -c -o $@ $<
|
||||||
|
-cla_wwaddw.o: cla_wwaddw.f ; $(FC) $(FFLAGS_NOOPT) -c -o $@ $<
|
||||||
|
-zla_wwaddw.o: zla_wwaddw.f ; $(FC) $(FFLAGS_NOOPT) -c -o $@ $<
|
||||||
|
+slaruv.o: slaruv.f ; $(FC) $(FFLAGS) -c -o $@ $<
|
||||||
|
+dlaruv.o: dlaruv.f ; $(FC) $(FFLAGS) -c -o $@ $<
|
||||||
|
+sla_wwaddw.o: sla_wwaddw.f ; $(FC) $(FFLAGS) -c -o $@ $<
|
||||||
|
+dla_wwaddw.o: dla_wwaddw.f ; $(FC) $(FFLAGS) -c -o $@ $<
|
||||||
|
+cla_wwaddw.o: cla_wwaddw.f ; $(FC) $(FFLAGS) -c -o $@ $<
|
||||||
|
+zla_wwaddw.o: zla_wwaddw.f ; $(FC) $(FFLAGS) -c -o $@ $<
|
||||||
|
diff --git a/lapack-netlib/TESTING/MATGEN/Makefile b/lapack-netlib/TESTING/MATGEN/Makefile
|
||||||
|
index e21ebd6c..8582e944 100644
|
||||||
|
--- a/lapack-netlib/TESTING/MATGEN/Makefile
|
||||||
|
+++ b/lapack-netlib/TESTING/MATGEN/Makefile
|
||||||
|
@@ -110,8 +110,8 @@ cleanlib:
|
||||||
|
rm -f $(TMGLIB)
|
||||||
|
|
||||||
|
ifeq ($(filter $(BUILD_SINGLE) $(BUILD_COMPLEX),1),)
|
||||||
|
-slaran.o: slaran.f ; $(FC) $(FFLAGS_NOOPT) -c -o $@ $<
|
||||||
|
+slaran.o: slaran.f ; $(FC) $(FFLAGS) -c -o $@ $<
|
||||||
|
endif
|
||||||
|
ifeq ($(filter $(BUILD_DOUBLE) $(BUILD_COMPLEX16),1),)
|
||||||
|
-dlaran.o: dlaran.f ; $(FC) $(FFLAGS_NOOPT) -c -o $@ $<
|
||||||
|
+dlaran.o: dlaran.f ; $(FC) $(FFLAGS) -c -o $@ $<
|
||||||
|
endif
|
39
SOURCES/openblas-0.3.15-power-optimize.patch
Normal file
39
SOURCES/openblas-0.3.15-power-optimize.patch
Normal file
@ -0,0 +1,39 @@
|
|||||||
|
diff --git a/kernel/power/drot.c b/kernel/power/drot.c
|
||||||
|
index 3229878e..a25ccceb 100644
|
||||||
|
--- a/kernel/power/drot.c
|
||||||
|
+++ b/kernel/power/drot.c
|
||||||
|
@@ -37,8 +37,6 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
|
||||||
|
#include "common.h"
|
||||||
|
|
||||||
|
-#pragma GCC optimize "O1"
|
||||||
|
-
|
||||||
|
#if defined(__VEC__) || defined(__ALTIVEC__)
|
||||||
|
#if defined(POWER8) || defined(POWER9)
|
||||||
|
#include "drot_microk_power8.c"
|
||||||
|
diff --git a/kernel/power/srot.c b/kernel/power/srot.c
|
||||||
|
index 5a0d4b12..d73fafc9 100644
|
||||||
|
--- a/kernel/power/srot.c
|
||||||
|
+++ b/kernel/power/srot.c
|
||||||
|
@@ -37,8 +37,6 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
|
||||||
|
#include "common.h"
|
||||||
|
|
||||||
|
-#pragma GCC optimize "O1"
|
||||||
|
-
|
||||||
|
#if defined(__VEC__) || defined(__ALTIVEC__)
|
||||||
|
#if defined(POWER8) || defined(POWER9)
|
||||||
|
#include "srot_microk_power8.c"
|
||||||
|
diff --git a/kernel/power/zscal.c b/kernel/power/zscal.c
|
||||||
|
index 59ddc149..a5e35001 100644
|
||||||
|
--- a/kernel/power/zscal.c
|
||||||
|
+++ b/kernel/power/zscal.c
|
||||||
|
@@ -36,8 +36,6 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
|
||||||
|
#include "common.h"
|
||||||
|
|
||||||
|
-#pragma GCC optimize "O1"
|
||||||
|
-
|
||||||
|
#if defined(__VEC__) || defined(__ALTIVEC__)
|
||||||
|
#if defined(POWER8) || defined(POWER9)
|
||||||
|
#if defined(DOUBLE)
|
@ -1,20 +1,27 @@
|
|||||||
diff -up OpenBLAS-0.2.15/Makefile.system_lapack OpenBLAS-0.2.15/Makefile
|
diff --git a/Makefile b/Makefile
|
||||||
--- OpenBLAS-0.2.15/Makefile.system_lapack 2015-10-27 13:44:50.000000000 -0700
|
index e113026..ae8f7de 100644
|
||||||
+++ OpenBLAS-0.2.15/Makefile 2015-10-28 09:14:56.696685503 -0700
|
--- a/Makefile
|
||||||
@@ -16,11 +16,7 @@ BLASDIRS += reference
|
+++ b/Makefile
|
||||||
|
@@ -12,9 +12,6 @@ BLASDIRS += reference
|
||||||
endif
|
endif
|
||||||
|
|
||||||
SUBDIRS = $(BLASDIRS)
|
SUBDIRS = $(BLASDIRS)
|
||||||
-ifneq ($(NO_LAPACK), 1)
|
-ifneq ($(NO_LAPACK), 1)
|
||||||
-SUBDIRS += lapack
|
-SUBDIRS += lapack
|
||||||
-endif
|
-endif
|
||||||
-
|
|
||||||
|
RELA =
|
||||||
|
ifeq ($(BUILD_RELAPACK), 1)
|
||||||
|
@@ -32,8 +29,6 @@ export NOFORTRAN
|
||||||
|
export NO_LAPACK
|
||||||
|
endif
|
||||||
|
|
||||||
-LAPACK_NOOPT := $(filter-out -O0 -O1 -O2 -O3 -Ofast,$(LAPACK_FFLAGS))
|
-LAPACK_NOOPT := $(filter-out -O0 -O1 -O2 -O3 -Ofast,$(LAPACK_FFLAGS))
|
||||||
+SUBDIRS += lapack
|
-
|
||||||
|
SUBDIRS_ALL = $(SUBDIRS) test ctest utest exports benchmark ../laswp ../bench cpp_thread_test
|
||||||
|
|
||||||
SUBDIRS_ALL = $(SUBDIRS) test ctest utest exports benchmark ../laswp ../bench
|
.PHONY : all libs netlib $(RELA) test ctest shared install
|
||||||
|
@@ -235,76 +230,8 @@ hpl_p :
|
||||||
@@ -211,57 +207,8 @@ hpl_p :
|
|
||||||
fi; \
|
fi; \
|
||||||
done
|
done
|
||||||
|
|
||||||
@ -23,7 +30,7 @@ diff -up OpenBLAS-0.2.15/Makefile.system_lapack OpenBLAS-0.2.15/Makefile
|
|||||||
-
|
-
|
||||||
-else
|
-else
|
||||||
-netlib : lapack_prebuild
|
-netlib : lapack_prebuild
|
||||||
-ifndef NOFORTRAN
|
-ifeq ($(NOFORTRAN), $(filter 0,$(NOFORTRAN)))
|
||||||
- @$(MAKE) -C $(NETLIB_LAPACK_DIR) lapacklib
|
- @$(MAKE) -C $(NETLIB_LAPACK_DIR) lapacklib
|
||||||
- @$(MAKE) -C $(NETLIB_LAPACK_DIR) tmglib
|
- @$(MAKE) -C $(NETLIB_LAPACK_DIR) tmglib
|
||||||
-endif
|
-endif
|
||||||
@ -32,34 +39,49 @@ diff -up OpenBLAS-0.2.15/Makefile.system_lapack OpenBLAS-0.2.15/Makefile
|
|||||||
-endif
|
-endif
|
||||||
-endif
|
-endif
|
||||||
-
|
-
|
||||||
|
-ifeq ($(NO_LAPACK), 1)
|
||||||
|
-re_lapack :
|
||||||
|
-
|
||||||
|
-else
|
||||||
|
-re_lapack :
|
||||||
|
- @$(MAKE) -C relapack
|
||||||
|
-endif
|
||||||
|
-
|
||||||
-prof_lapack : lapack_prebuild
|
-prof_lapack : lapack_prebuild
|
||||||
- @$(MAKE) -C $(NETLIB_LAPACK_DIR) lapack_prof
|
- @$(MAKE) -C $(NETLIB_LAPACK_DIR) lapack_prof
|
||||||
-
|
-
|
||||||
-lapack_prebuild :
|
-lapack_prebuild :
|
||||||
-ifndef NOFORTRAN
|
-ifeq ($(NOFORTRAN), $(filter 0,$(NOFORTRAN)))
|
||||||
- -@echo "FORTRAN = $(FC)" > $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "FC = $(FC)" > $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "OPTS = $(LAPACK_FFLAGS)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "FFLAGS = $(LAPACK_FFLAGS)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
|
- -@echo "FFLAGS_DRV = $(LAPACK_FFLAGS)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "POPTS = $(LAPACK_FPFLAGS)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "POPTS = $(LAPACK_FPFLAGS)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "NOOPT = -O0 $(LAPACK_NOOPT)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "FFLAGS_NOOPT = -O0 $(LAPACK_NOOPT)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "PNOOPT = $(LAPACK_FPFLAGS) -O0" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "PNOOPT = $(LAPACK_FPFLAGS) -O0" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "LOADOPTS = $(FFLAGS) $(EXTRALIB)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "LDFLAGS = $(FFLAGS) $(EXTRALIB)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "CC = $(CC)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "CC = $(CC)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "override CFLAGS = $(LAPACK_CFLAGS)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "override CFLAGS = $(LAPACK_CFLAGS)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "ARCH = $(AR)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "AR = $(AR)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "ARCHFLAGS = -ru" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "ARFLAGS = $(ARFLAGS) -ru" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "RANLIB = $(RANLIB)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "RANLIB = $(RANLIB)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "LAPACKLIB = ../$(LIBNAME)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "LAPACKLIB = ../../$(LIBNAME)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "TMGLIB = ../$(LIBNAME)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "TMGLIB = ../../../$(LIBNAME)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "BLASLIB = ../../../$(LIBNAME)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "BLASLIB = ../../../$(LIBNAME)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "LAPACKELIB = ../$(LIBNAME)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "LAPACKELIB = ../../../$(LIBNAME)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "LAPACKLIB_P = ../$(LIBNAME_P)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "LAPACKLIB_P = ../$(LIBNAME_P)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "SUFFIX = $(SUFFIX)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "SUFFIX = $(SUFFIX)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "PSUFFIX = $(PSUFFIX)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "PSUFFIX = $(PSUFFIX)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "CEXTRALIB = $(EXTRALIB)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "CEXTRALIB = $(EXTRALIB)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
-ifeq ($(FC), gfortran)
|
-ifeq ($(F_COMPILER), GFORTRAN)
|
||||||
- -@echo "TIMER = INT_ETIME" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "TIMER = INT_ETIME" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
-ifdef SMP
|
-ifdef SMP
|
||||||
|
-ifeq ($(OSNAME), WINNT)
|
||||||
|
- -@echo "LOADER = $(FC)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
|
-else ifeq ($(OSNAME), Haiku)
|
||||||
|
- -@echo "LOADER = $(FC)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
|
-else
|
||||||
- -@echo "LOADER = $(FC) -pthread" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "LOADER = $(FC) -pthread" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
|
-endif
|
||||||
-else
|
-else
|
||||||
- -@echo "LOADER = $(FC)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "LOADER = $(FC)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
-endif
|
-endif
|
||||||
@ -67,17 +89,22 @@ diff -up OpenBLAS-0.2.15/Makefile.system_lapack OpenBLAS-0.2.15/Makefile
|
|||||||
- -@echo "TIMER = NONE" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "TIMER = NONE" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@echo "LOADER = $(FC)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@echo "LOADER = $(FC)" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
-endif
|
-endif
|
||||||
|
-ifeq ($(BUILD_LAPACK_DEPRECATED), 1)
|
||||||
|
- -@echo "BUILD_DEPRECATED = 1" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
|
-endif
|
||||||
|
- -@echo "LAPACKE_WITH_TMG = 1" >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
- -@cat make.inc >> $(NETLIB_LAPACK_DIR)/make.inc
|
- -@cat make.inc >> $(NETLIB_LAPACK_DIR)/make.inc
|
||||||
-endif
|
-endif
|
||||||
+ @$(MAKE) -C $(NETLIB_LAPACK_DIR)
|
+ @$(MAKE) -C $(NETLIB_LAPACK_DIR)
|
||||||
|
|
||||||
large.tgz :
|
large.tgz :
|
||||||
ifndef NOFORTRAN
|
ifeq ($(NOFORTRAN), $(filter 0,$(NOFORTRAN)))
|
||||||
diff -up OpenBLAS-0.2.15/Makefile.system.system_lapack OpenBLAS-0.2.15/Makefile.system
|
diff --git a/Makefile.system b/Makefile.system
|
||||||
--- OpenBLAS-0.2.15/Makefile.system.system_lapack 2015-10-27 13:44:50.000000000 -0700
|
index 8d78b42..47d8eec 100644
|
||||||
+++ OpenBLAS-0.2.15/Makefile.system 2015-10-28 09:14:39.994350500 -0700
|
--- a/Makefile.system
|
||||||
@@ -9,7 +9,7 @@ ifndef TOPDIR
|
+++ b/Makefile.system
|
||||||
TOPDIR = .
|
@@ -31,7 +31,7 @@ else ifeq ($(ARCH), zarch)
|
||||||
|
override ARCH=zarch
|
||||||
endif
|
endif
|
||||||
|
|
||||||
-NETLIB_LAPACK_DIR = $(TOPDIR)/lapack-netlib
|
-NETLIB_LAPACK_DIR = $(TOPDIR)/lapack-netlib
|
@ -1,26 +1,22 @@
|
|||||||
diff -up OpenBLAS-0.3.21/Makefile.fixtests OpenBLAS-0.3.21/Makefile
|
diff --git a/Makefile b/Makefile
|
||||||
--- OpenBLAS-0.3.21/Makefile.fixtests 2022-08-26 07:37:06.257272957 +0200
|
index 555d1c46..7dc74273 100644
|
||||||
+++ OpenBLAS-0.3.21/Makefile 2022-08-26 07:37:53.168414307 +0200
|
--- a/Makefile
|
||||||
@@ -147,18 +147,18 @@ tests :
|
+++ b/Makefile
|
||||||
|
@@ -144,13 +144,13 @@ tests :
|
||||||
ifeq ($(NOFORTRAN), $(filter 0,$(NOFORTRAN)))
|
ifeq ($(NOFORTRAN), $(filter 0,$(NOFORTRAN)))
|
||||||
touch $(LIBNAME)
|
touch $(LIBNAME)
|
||||||
ifndef NO_FBLAS
|
ifndef NO_FBLAS
|
||||||
- $(MAKE) -C test all
|
- $(MAKE) -C test all
|
||||||
+ $(MAKE) -C test FC="$(FC)" CC="$(CC)" COMMON_OPT="$(COMMON_OPT)" FCOMMON_OPT="$(FCOMMON_OPT)" all
|
+ $(MAKE) -C test FC="$(FC)" CC="$(CC)" COMMON_OPT="$(COMMON_OPT)" FCOMMON_OPT="$(FCOMMON_OPT)" all
|
||||||
endif
|
endif
|
||||||
endif
|
|
||||||
ifneq ($(ONLY_CBLAS), 1)
|
|
||||||
- $(MAKE) -C utest all
|
- $(MAKE) -C utest all
|
||||||
+ $(MAKE) -C utest FC="$(FC)" CC="$(CC)" COMMON_OPT="$(COMMON_OPT)" FCOMMON_OPT="$(FCOMMON_OPT)" all
|
+ $(MAKE) -C utest FC="$(FC)" CC="$(CC)" COMMON_OPT="$(COMMON_OPT)" FCOMMON_OPT="$(FCOMMON_OPT)" all
|
||||||
endif
|
|
||||||
ifneq ($(NO_CBLAS), 1)
|
ifneq ($(NO_CBLAS), 1)
|
||||||
ifneq ($(ONLY_CBLAS), 1)
|
|
||||||
- $(MAKE) -C ctest all
|
- $(MAKE) -C ctest all
|
||||||
+ $(MAKE) -C ctest FC="$(FC)" CC="$(CC)" COMMON_OPT="$(COMMON_OPT)" FCOMMON_OPT="$(FCOMMON_OPT)" all
|
+ $(MAKE) -C ctest FC="$(FC)" CC="$(CC)" COMMON_OPT="$(COMMON_OPT)" FCOMMON_OPT="$(FCOMMON_OPT)" all
|
||||||
endif
|
|
||||||
ifeq ($(CPP_THREAD_SAFETY_TEST), 1)
|
ifeq ($(CPP_THREAD_SAFETY_TEST), 1)
|
||||||
- $(MAKE) -C cpp_thread_test all
|
- $(MAKE) -C cpp_thread_test all
|
||||||
+ $(MAKE) -C cpp_thread_test FC="$(FC)" CC="$(CC)" COMMON_OPT="$(COMMON_OPT)" FCOMMON_OPT="$(FCOMMON_OPT)" all
|
+ $(MAKE) -C cpp_thread_test FC="$(FC)" CC="$(CC)" COMMON_OPT="$(COMMON_OPT)" FCOMMON_OPT="$(FCOMMON_OPT)" all
|
||||||
endif
|
endif
|
||||||
endif
|
endif
|
||||||
|
endif
|
107
SOURCES/openblas-CVE-2021-4048.patch
Normal file
107
SOURCES/openblas-CVE-2021-4048.patch
Normal file
@ -0,0 +1,107 @@
|
|||||||
|
From 2be5ee3cca97a597f2ee2118808a2d5eacea050c Mon Sep 17 00:00:00 2001
|
||||||
|
From: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de>
|
||||||
|
Date: Fri, 1 Oct 2021 11:17:21 +0200
|
||||||
|
Subject: [PATCH 1/4] Fix out of bounds read in ?llarv (Reference-LAPACK PR
|
||||||
|
625)
|
||||||
|
|
||||||
|
---
|
||||||
|
lapack-netlib/SRC/clarrv.f | 2 +-
|
||||||
|
1 file changed, 1 insertion(+), 1 deletion(-)
|
||||||
|
|
||||||
|
diff --git a/lapack-netlib/SRC/clarrv.f b/lapack-netlib/SRC/clarrv.f
|
||||||
|
index a45f55ac..26a9febc 100644
|
||||||
|
--- a/lapack-netlib/SRC/clarrv.f
|
||||||
|
+++ b/lapack-netlib/SRC/clarrv.f
|
||||||
|
@@ -351,7 +351,7 @@
|
||||||
|
*
|
||||||
|
* Quick return if possible
|
||||||
|
*
|
||||||
|
- IF( N.LE.0 ) THEN
|
||||||
|
+ IF( (N.LE.0) .OR. (M.LE.0) ) THEN
|
||||||
|
RETURN
|
||||||
|
END IF
|
||||||
|
*
|
||||||
|
--
|
||||||
|
2.34.1
|
||||||
|
|
||||||
|
|
||||||
|
From fe497efa0510466fd93578aaf9da1ad8ed4edbe7 Mon Sep 17 00:00:00 2001
|
||||||
|
From: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de>
|
||||||
|
Date: Fri, 1 Oct 2021 11:18:20 +0200
|
||||||
|
Subject: [PATCH 2/4] Fix out of bounds read in ?llarv (Reference-LAPACK PR
|
||||||
|
625)
|
||||||
|
|
||||||
|
---
|
||||||
|
lapack-netlib/SRC/dlarrv.f | 2 +-
|
||||||
|
1 file changed, 1 insertion(+), 1 deletion(-)
|
||||||
|
|
||||||
|
diff --git a/lapack-netlib/SRC/dlarrv.f b/lapack-netlib/SRC/dlarrv.f
|
||||||
|
index 4a59a2bb..a1c6e9c9 100644
|
||||||
|
--- a/lapack-netlib/SRC/dlarrv.f
|
||||||
|
+++ b/lapack-netlib/SRC/dlarrv.f
|
||||||
|
@@ -353,7 +353,7 @@
|
||||||
|
*
|
||||||
|
* Quick return if possible
|
||||||
|
*
|
||||||
|
- IF( N.LE.0 ) THEN
|
||||||
|
+ IF( (N.LE.0).OR.(M.LE.0) ) THEN
|
||||||
|
RETURN
|
||||||
|
END IF
|
||||||
|
*
|
||||||
|
--
|
||||||
|
2.34.1
|
||||||
|
|
||||||
|
|
||||||
|
From ddb0ff5353637bb5f5ad060c9620e334c143e3d7 Mon Sep 17 00:00:00 2001
|
||||||
|
From: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de>
|
||||||
|
Date: Fri, 1 Oct 2021 11:19:07 +0200
|
||||||
|
Subject: [PATCH 3/4] Fix out of bounds read in ?llarv (Reference-LAPACK PR
|
||||||
|
625)
|
||||||
|
|
||||||
|
---
|
||||||
|
lapack-netlib/SRC/slarrv.f | 2 +-
|
||||||
|
1 file changed, 1 insertion(+), 1 deletion(-)
|
||||||
|
|
||||||
|
diff --git a/lapack-netlib/SRC/slarrv.f b/lapack-netlib/SRC/slarrv.f
|
||||||
|
index 04519fde..9448b2fd 100644
|
||||||
|
--- a/lapack-netlib/SRC/slarrv.f
|
||||||
|
+++ b/lapack-netlib/SRC/slarrv.f
|
||||||
|
@@ -353,7 +353,7 @@
|
||||||
|
*
|
||||||
|
* Quick return if possible
|
||||||
|
*
|
||||||
|
- IF( N.LE.0 ) THEN
|
||||||
|
+ IF( (N.LE.0).OR.(M.LE.0) ) THEN
|
||||||
|
RETURN
|
||||||
|
END IF
|
||||||
|
*
|
||||||
|
--
|
||||||
|
2.34.1
|
||||||
|
|
||||||
|
|
||||||
|
From 337b65133df174796794871b3988cd03426e6d41 Mon Sep 17 00:00:00 2001
|
||||||
|
From: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de>
|
||||||
|
Date: Fri, 1 Oct 2021 11:19:53 +0200
|
||||||
|
Subject: [PATCH 4/4] Fix out of bounds read in ?llarv (Reference-LAPACK PR
|
||||||
|
625)
|
||||||
|
|
||||||
|
---
|
||||||
|
lapack-netlib/SRC/zlarrv.f | 2 +-
|
||||||
|
1 file changed, 1 insertion(+), 1 deletion(-)
|
||||||
|
|
||||||
|
diff --git a/lapack-netlib/SRC/zlarrv.f b/lapack-netlib/SRC/zlarrv.f
|
||||||
|
index 23976dbe..8d10e3c2 100644
|
||||||
|
--- a/lapack-netlib/SRC/zlarrv.f
|
||||||
|
+++ b/lapack-netlib/SRC/zlarrv.f
|
||||||
|
@@ -351,7 +351,7 @@
|
||||||
|
*
|
||||||
|
* Quick return if possible
|
||||||
|
*
|
||||||
|
- IF( N.LE.0 ) THEN
|
||||||
|
+ IF( (N.LE.0).OR.(M.LE.0) ) THEN
|
||||||
|
RETURN
|
||||||
|
END IF
|
||||||
|
*
|
||||||
|
--
|
||||||
|
2.34.1
|
||||||
|
|
@ -1,6 +1,9 @@
|
|||||||
%bcond_with system_lapack
|
%bcond_with system_lapack
|
||||||
# Version of bundled lapack
|
# Version of bundled lapack
|
||||||
%global lapackver 3.11.0
|
%global lapackver 3.9.1
|
||||||
|
|
||||||
|
# Use strip from gcc-toolset-12
|
||||||
|
%global __strip "scl enable gcc-toolset-12 -- strip"
|
||||||
|
|
||||||
# DO NOT "CLEAN UP" OR MODIFY THIS SPEC FILE WITHOUT ASKING THE
|
# DO NOT "CLEAN UP" OR MODIFY THIS SPEC FILE WITHOUT ASKING THE
|
||||||
# MAINTAINER FIRST!
|
# MAINTAINER FIRST!
|
||||||
@ -14,35 +17,35 @@
|
|||||||
# "obsoleted" features are still kept in the spec.
|
# "obsoleted" features are still kept in the spec.
|
||||||
|
|
||||||
Name: openblas
|
Name: openblas
|
||||||
Version: 0.3.26
|
Version: 0.3.15
|
||||||
Release: 2%{?dist}
|
Release: 6%{?dist}
|
||||||
Summary: An optimized BLAS library based on GotoBLAS2
|
Summary: An optimized BLAS library based on GotoBLAS2
|
||||||
License: BSD-3-Clause
|
Group: Development/Libraries
|
||||||
URL: https://github.com/OpenMathLib/OpenBLAS
|
License: BSD
|
||||||
Source0: %url/archive/v%{version}/OpenBLAS-%{version}.tar.gz
|
URL: https://github.com/xianyi/OpenBLAS/
|
||||||
|
Source0: https://github.com/xianyi/OpenBLAS/archive/v%{version}.tar.gz
|
||||||
# Use system lapack
|
# Use system lapack
|
||||||
Patch0: openblas-0.2.15-system_lapack.patch
|
Patch0: openblas-0.3.15-system-lapack.patch
|
||||||
# Drop extra p from threaded library name
|
# Drop extra p from threaded library name
|
||||||
Patch1: openblas-0.2.5-libname.patch
|
Patch1: openblas-0.3.15-libname.patch
|
||||||
# Don't use constructor priorities on too old architectures
|
|
||||||
Patch2: openblas-0.2.15-constructor.patch
|
|
||||||
# Supply the proper flags to the test makefile
|
# Supply the proper flags to the test makefile
|
||||||
Patch3: openblas-0.3.11-tests.patch
|
Patch2: openblas-0.3.15-tests.patch
|
||||||
# Fix incompatible pointer types (causes FTBFS on ppc64le)
|
# Enable optimizations for all LAPACK sources
|
||||||
Patch4: openblas-0.3.26-incompatibletypes.patch
|
Patch3: openblas-0.3.15-noopt.patch
|
||||||
|
# Pass ASMFLAGS to assembler compiler
|
||||||
|
Patch4: openblas-0.3.15-asmflags.patch
|
||||||
|
# Remove optimization pragmas on ppc64le
|
||||||
|
Patch5: openblas-0.3.15-power-optimize.patch
|
||||||
|
|
||||||
BuildRequires: make
|
Patch6: openblas-CVE-2021-4048.patch
|
||||||
BuildRequires: gcc
|
|
||||||
BuildRequires: gcc-c++
|
BuildRequires: scl-utils
|
||||||
BuildRequires: gcc-gfortran
|
BuildRequires: gcc-toolset-12-gcc
|
||||||
|
BuildRequires: gcc-toolset-12-gcc-gfortran
|
||||||
|
BuildRequires: gcc-toolset-12-annobin-plugin-gcc
|
||||||
BuildRequires: perl-devel
|
BuildRequires: perl-devel
|
||||||
BuildRequires: multilib-rpm-config
|
BuildRequires: multilib-rpm-config
|
||||||
|
|
||||||
# Rblas library is no longer necessary
|
|
||||||
%if 0%{?fedora} >= 31 || 0%{?rhel} >= 8
|
|
||||||
Obsoletes: %{name}-Rblas < %{version}-%{release}
|
|
||||||
%endif
|
|
||||||
|
|
||||||
# Do we have execstack?
|
# Do we have execstack?
|
||||||
%if 0%{?rhel} == 7
|
%if 0%{?rhel} == 7
|
||||||
%ifarch ppc64le aarch64
|
%ifarch ppc64le aarch64
|
||||||
@ -80,10 +83,8 @@ Provides: bundled(lapack) = %{lapackver}
|
|||||||
# Build 64-bit interface binaries?
|
# Build 64-bit interface binaries?
|
||||||
%if 0%{?__isa_bits} == 64
|
%if 0%{?__isa_bits} == 64
|
||||||
%global build64 1
|
%global build64 1
|
||||||
%bcond_without cpp_thread_check
|
|
||||||
%else
|
%else
|
||||||
%global build64 0
|
%global build64 0
|
||||||
%bcond_with cpp_thread_check
|
|
||||||
%endif
|
%endif
|
||||||
|
|
||||||
%if %{with system_lapack}
|
%if %{with system_lapack}
|
||||||
@ -105,103 +106,98 @@ Computational Science, ISCAS. http://www.rdcps.ac.cn
|
|||||||
%description
|
%description
|
||||||
%{base_description}
|
%{base_description}
|
||||||
|
|
||||||
%package serial
|
%package Rblas
|
||||||
Summary: An optimized BLAS library based on GotoBLAS2, serial version
|
Summary: A version of OpenBLAS for R to use as libRblas
|
||||||
Requires: %{name} = %{version}-%{release}
|
Group: Development/Libraries
|
||||||
|
|
||||||
%description serial
|
%description Rblas
|
||||||
%{base_description}
|
%{base_description}
|
||||||
|
|
||||||
This package contains the sequential library compiled with a 32-bit
|
|
||||||
integer interface.
|
|
||||||
|
|
||||||
%package openmp
|
%package openmp
|
||||||
Summary: An optimized BLAS library based on GotoBLAS2, OpenMP version
|
Summary: An optimized BLAS library based on GotoBLAS2, OpenMP version
|
||||||
Requires: %{name} = %{version}-%{release}
|
Group: Development/Libraries
|
||||||
|
|
||||||
%description openmp
|
%description openmp
|
||||||
%{base_description}
|
%{base_description}
|
||||||
|
|
||||||
This package contains the library compiled with OpenMP support with
|
This package contains the library compiled with OpenMP support.
|
||||||
32-bit integer interface.
|
|
||||||
|
|
||||||
%package threads
|
%package threads
|
||||||
Summary: An optimized BLAS library based on GotoBLAS2, pthreads version
|
Summary: An optimized BLAS library based on GotoBLAS2, pthreads version
|
||||||
Requires: %{name} = %{version}-%{release}
|
Group: Development/Libraries
|
||||||
|
|
||||||
%description threads
|
%description threads
|
||||||
%{base_description}
|
%{base_description}
|
||||||
|
|
||||||
This package contains the library compiled with threading support and
|
This package contains the library compiled with threading support.
|
||||||
a 32-bit integer interface.
|
|
||||||
|
|
||||||
%if %build64
|
%if %build64
|
||||||
%package serial64
|
%package serial64
|
||||||
Summary: An optimized BLAS library based on GotoBLAS2, serial version
|
Summary: An optimized BLAS library based on GotoBLAS2, serial version
|
||||||
Requires: %{name} = %{version}-%{release}
|
Group: Development/Libraries
|
||||||
|
|
||||||
%description serial64
|
%description serial64
|
||||||
%{base_description}
|
%{base_description}
|
||||||
|
|
||||||
This package contains the sequential library compiled with a 64-bit
|
This package contains the sequential library compiled with a 64-bit
|
||||||
integer interface.
|
interface.
|
||||||
|
|
||||||
%package openmp64
|
%package openmp64
|
||||||
Summary: An optimized BLAS library based on GotoBLAS2, OpenMP version
|
Summary: An optimized BLAS library based on GotoBLAS2, OpenMP version
|
||||||
Requires: %{name} = %{version}-%{release}
|
Group: Development/Libraries
|
||||||
|
|
||||||
%description openmp64
|
%description openmp64
|
||||||
%{base_description}
|
%{base_description}
|
||||||
|
|
||||||
This package contains the library compiled with OpenMP support and
|
This package contains the library compiled with OpenMP support and
|
||||||
64-bit integer interface.
|
64-bit interface.
|
||||||
|
|
||||||
%package threads64
|
%package threads64
|
||||||
Summary: An optimized BLAS library based on GotoBLAS2, pthreads version
|
Summary: An optimized BLAS library based on GotoBLAS2, pthreads version
|
||||||
Requires: %{name} = %{version}-%{release}
|
Group: Development/Libraries
|
||||||
|
|
||||||
%description threads64
|
%description threads64
|
||||||
%{base_description}
|
%{base_description}
|
||||||
|
|
||||||
This package contains the library compiled with threading support and
|
This package contains the library compiled with threading support and
|
||||||
64-bit integer interface.
|
64-bit interface.
|
||||||
|
|
||||||
%package serial64_
|
%package serial64_
|
||||||
Summary: An optimized BLAS library based on GotoBLAS2, serial version
|
Summary: An optimized BLAS library based on GotoBLAS2, serial version
|
||||||
Requires: %{name} = %{version}-%{release}
|
Group: Development/Libraries
|
||||||
|
|
||||||
%description serial64_
|
%description serial64_
|
||||||
%{base_description}
|
%{base_description}
|
||||||
|
|
||||||
This package contains the sequential library compiled with a 64-bit
|
This package contains the sequential library compiled with a 64-bit
|
||||||
integer interface and a symbol name suffix.
|
interface and a symbol name suffix.
|
||||||
|
|
||||||
%package openmp64_
|
%package openmp64_
|
||||||
Summary: An optimized BLAS library based on GotoBLAS2, OpenMP version
|
Summary: An optimized BLAS library based on GotoBLAS2, OpenMP version
|
||||||
Requires: %{name} = %{version}-%{release}
|
Group: Development/Libraries
|
||||||
|
|
||||||
%description openmp64_
|
%description openmp64_
|
||||||
%{base_description}
|
%{base_description}
|
||||||
|
|
||||||
This package contains the library compiled with OpenMP support and
|
This package contains the library compiled with OpenMP support and
|
||||||
64-bit integer interface and a symbol name suffix.
|
64-bit interface and a symbol name suffix.
|
||||||
|
|
||||||
%package threads64_
|
%package threads64_
|
||||||
Summary: An optimized BLAS library based on GotoBLAS2, pthreads version
|
Summary: An optimized BLAS library based on GotoBLAS2, pthreads version
|
||||||
Requires: %{name} = %{version}-%{release}
|
Group: Development/Libraries
|
||||||
|
|
||||||
%description threads64_
|
%description threads64_
|
||||||
%{base_description}
|
%{base_description}
|
||||||
|
|
||||||
This package contains the library compiled with threading support and
|
This package contains the library compiled with threading support and
|
||||||
64-bit integer interface and a symbol name suffix.
|
64-bit interface and a symbol name suffix.
|
||||||
%endif
|
%endif
|
||||||
|
|
||||||
|
|
||||||
%package devel
|
%package devel
|
||||||
Summary: Development headers and libraries for OpenBLAS
|
Summary: Development headers and libraries for OpenBLAS
|
||||||
|
Group: Development/Libraries
|
||||||
Requires: %{name}%{?_isa} = %{version}-%{release}
|
Requires: %{name}%{?_isa} = %{version}-%{release}
|
||||||
Requires: %{name}-serial%{?_isa} = %{version}-%{release}
|
|
||||||
Requires: %{name}-openmp%{?_isa} = %{version}-%{release}
|
Requires: %{name}-openmp%{?_isa} = %{version}-%{release}
|
||||||
Requires: %{name}-threads%{?_isa} = %{version}-%{release}
|
Requires: %{name}-threads%{?_isa} = %{version}-%{release}
|
||||||
%if %build64
|
%if %build64
|
||||||
@ -221,6 +217,7 @@ This package contains the development headers and libraries.
|
|||||||
|
|
||||||
%package static
|
%package static
|
||||||
Summary: Static version of OpenBLAS
|
Summary: Static version of OpenBLAS
|
||||||
|
Group: Development/Libraries
|
||||||
Requires: %{name}-devel%{?_isa} = %{version}-%{release}
|
Requires: %{name}-devel%{?_isa} = %{version}-%{release}
|
||||||
|
|
||||||
%description static
|
%description static
|
||||||
@ -236,14 +233,14 @@ This package contains the static libraries.
|
|||||||
tar zxf %{SOURCE0}
|
tar zxf %{SOURCE0}
|
||||||
cd OpenBLAS-%{version}
|
cd OpenBLAS-%{version}
|
||||||
%if %{with system_lapack}
|
%if %{with system_lapack}
|
||||||
%patch0 -p1 -b .system_lapack
|
%patch0 -p1 -b .system-lapack
|
||||||
%endif
|
%endif
|
||||||
%patch1 -p1 -b .libname
|
%patch1 -p1 -b .libname
|
||||||
%if 0%{?rhel} == 5
|
%patch2 -p1 -b .tests
|
||||||
%patch2 -p1 -b .constructor
|
%patch3 -p1 -b .noopt
|
||||||
%endif
|
%patch4 -p1 -b .asmflags
|
||||||
%patch3 -p1 -b .tests
|
%patch5 -p1 -b .power-optimize
|
||||||
%patch4 -p1 -b .incompatibletypes
|
%patch6 -p1 -b .cve-2021-4048
|
||||||
|
|
||||||
# Fix source permissions
|
# Fix source permissions
|
||||||
find -name \*.f -exec chmod 644 {} \;
|
find -name \*.f -exec chmod 644 {} \;
|
||||||
@ -254,6 +251,7 @@ rm -rf lapack-netlib
|
|||||||
%endif
|
%endif
|
||||||
|
|
||||||
# Make serial, threaded and OpenMP versions; as well as 64-bit versions
|
# Make serial, threaded and OpenMP versions; as well as 64-bit versions
|
||||||
|
# Also make an libRblas.so
|
||||||
cd ..
|
cd ..
|
||||||
cp -ar OpenBLAS-%{version} openmp
|
cp -ar OpenBLAS-%{version} openmp
|
||||||
cp -ar OpenBLAS-%{version} threaded
|
cp -ar OpenBLAS-%{version} threaded
|
||||||
@ -262,8 +260,14 @@ for d in {serial,threaded,openmp}64{,_}; do
|
|||||||
cp -ar OpenBLAS-%{version} $d
|
cp -ar OpenBLAS-%{version} $d
|
||||||
done
|
done
|
||||||
%endif
|
%endif
|
||||||
|
cp -ar OpenBLAS-%{version} Rblas
|
||||||
mv OpenBLAS-%{version} serial
|
mv OpenBLAS-%{version} serial
|
||||||
|
|
||||||
|
# Hackup Rblas Makefiles
|
||||||
|
sed -i 's|.so.$(MAJOR_VERSION)|.so|g' Rblas/Makefile
|
||||||
|
sed -i 's|.so.$(MAJOR_VERSION)|.so|g' Rblas/exports/Makefile
|
||||||
|
sed -i 's|@ln -fs $(LIBSONAME) $(LIBPREFIX).so|#@ln -fs $(LIBSONAME) $(LIBPREFIX).so|g' Rblas/Makefile
|
||||||
|
|
||||||
%if %{with system_lapack}
|
%if %{with system_lapack}
|
||||||
# Setup 32-bit interface LAPACK
|
# Setup 32-bit interface LAPACK
|
||||||
mkdir netliblapack
|
mkdir netliblapack
|
||||||
@ -340,9 +344,9 @@ rm -rf netliblapack64
|
|||||||
%endif
|
%endif
|
||||||
|
|
||||||
%build
|
%build
|
||||||
# openblas fails to build with LTO due to undefined symbols. These could
|
# Enable gcc-toolset-12
|
||||||
# well be the result of the assembly code used in this package
|
source scl_source enable gcc-toolset-12
|
||||||
%define _lto_cflags %{nil}
|
|
||||||
%if !%{lapacke}
|
%if !%{lapacke}
|
||||||
LAPACKE="NO_LAPACKE=1"
|
LAPACKE="NO_LAPACKE=1"
|
||||||
%endif
|
%endif
|
||||||
@ -376,7 +380,7 @@ TARGET="TARGET=POWER7 DYNAMIC_ARCH=1 DYNAMIC_OLDER=1"
|
|||||||
TARGET="TARGET=POWER8 DYNAMIC_ARCH=1 DYNAMIC_OLDER=1"
|
TARGET="TARGET=POWER8 DYNAMIC_ARCH=1 DYNAMIC_OLDER=1"
|
||||||
%endif
|
%endif
|
||||||
%ifarch aarch64
|
%ifarch aarch64
|
||||||
TARGET="TARGET=ARMV8 DYNAMIC_ARCH=1 DYNAMIC_OLDER=1"
|
TARGET="TARGET=ARMV8 DYNAMIC_ARCH=0"
|
||||||
%endif
|
%endif
|
||||||
%ifarch s390x
|
%ifarch s390x
|
||||||
TARGET="TARGET=ZARCH_GENERIC DYNAMIC_ARCH=1 DYNAMIC_OLDER=1"
|
TARGET="TARGET=ZARCH_GENERIC DYNAMIC_ARCH=1 DYNAMIC_OLDER=1"
|
||||||
@ -385,46 +389,54 @@ TARGET="TARGET=ZARCH_GENERIC DYNAMIC_ARCH=1 DYNAMIC_OLDER=1"
|
|||||||
%if 0%{?rhel} == 5
|
%if 0%{?rhel} == 5
|
||||||
# Gfortran too old to recognize -frecursive
|
# Gfortran too old to recognize -frecursive
|
||||||
COMMON="%{optflags} -fPIC"
|
COMMON="%{optflags} -fPIC"
|
||||||
FCOMMON="%{optflags} -fPIC"
|
FCOMMON="%{optflags} -fPIC -cpp"
|
||||||
%else
|
%else
|
||||||
COMMON="%{optflags} -fPIC"
|
COMMON="%{optflags} -fPIC"
|
||||||
FCOMMON="%{optflags} -fPIC -frecursive"
|
FCOMMON="%{optflags} -fPIC -frecursive -cpp"
|
||||||
%endif
|
%endif
|
||||||
# Use Fedora linker flags
|
# Use Fedora linker flags
|
||||||
export LDFLAGS="%{__global_ldflags}"
|
export LDFLAGS="%{__global_ldflags}"
|
||||||
|
|
||||||
|
# ensure object files built from assembler sources are annotated
|
||||||
|
export ASMFLAGS="-Wa,--generate-missing-build-notes=yes"
|
||||||
|
|
||||||
|
make -C Rblas $TARGET USE_THREAD=0 USEOPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libRblas" LIBSONAME="libRblas.so" $AVX $LAPACKE INTERFACE64=0
|
||||||
|
|
||||||
# Declare some necessary build flags
|
# Declare some necessary build flags
|
||||||
COMMON="%{optflags} -fPIC"
|
COMMON="%{optflags} -fPIC"
|
||||||
FCOMMON="$COMMON -frecursive"
|
FCOMMON="$COMMON -frecursive -cpp"
|
||||||
make -C serial $TARGET USE_THREAD=0 USE_LOCKING=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblas" $AVX $LAPACKE INTERFACE64=0
|
make -C serial $TARGET USE_THREAD=0 USE_LOCKING=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblas" $AVX $LAPACKE INTERFACE64=0
|
||||||
make -C threaded $TARGET USE_THREAD=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblasp" $AVX $LAPACKE INTERFACE64=0
|
make -C threaded $TARGET USE_THREAD=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblasp" $AVX $LAPACKE INTERFACE64=0
|
||||||
|
|
||||||
# USE_THREAD determines use of SMP, not of pthreads
|
# USE_THREAD determines use of SMP, not of pthreads
|
||||||
COMMON="%{optflags} -fPIC -fopenmp -pthread"
|
COMMON="%{optflags} -fPIC -fopenmp -pthread"
|
||||||
FCOMMON="$COMMON -frecursive"
|
FCOMMON="$COMMON -frecursive -cpp"
|
||||||
make -C openmp $TARGET USE_THREAD=1 USE_OPENMP=1 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblaso" $AVX $LAPACKE INTERFACE64=0 %{with cpp_thread_check:CPP_THREAD_SAFETY_TEST=1}
|
make -C openmp $TARGET USE_THREAD=1 USE_OPENMP=1 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblaso" $AVX $LAPACKE INTERFACE64=0
|
||||||
|
|
||||||
%if %build64
|
%if %build64
|
||||||
COMMON="%{optflags} -fPIC"
|
COMMON="%{optflags} -fPIC"
|
||||||
FCOMMON="$COMMON -frecursive -fdefault-integer-8"
|
FCOMMON="$COMMON -frecursive -fdefault-integer-8 -cpp"
|
||||||
make -C serial64 $TARGET USE_THREAD=0 USE_LOCKING=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblas64" $AVX $LAPACKE INTERFACE64=1
|
make -C serial64 $TARGET USE_THREAD=0 USE_LOCKING=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblas64" $AVX $LAPACKE INTERFACE64=1
|
||||||
make -C threaded64 $TARGET USE_THREAD=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblasp64" $AVX $LAPACKE INTERFACE64=1
|
make -C threaded64 $TARGET USE_THREAD=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblasp64" $AVX $LAPACKE INTERFACE64=1
|
||||||
|
|
||||||
COMMON="%{optflags} -fPIC -fopenmp -pthread"
|
COMMON="%{optflags} -fPIC -fopenmp -pthread"
|
||||||
FCOMMON="$COMMON -frecursive -fdefault-integer-8"
|
FCOMMON="$COMMON -frecursive -fdefault-integer-8 -cpp"
|
||||||
make -C openmp64 $TARGET USE_THREAD=1 USE_OPENMP=1 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblaso64" $AVX $LAPACKE INTERFACE64=1 CPP_THREAD_SAFETY_TEST=1
|
make -C openmp64 $TARGET USE_THREAD=1 USE_OPENMP=1 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblaso64" $AVX $LAPACKE INTERFACE64=1
|
||||||
|
|
||||||
COMMON="%{optflags} -fPIC"
|
COMMON="%{optflags} -fPIC"
|
||||||
FCOMMON="$COMMON -frecursive -fdefault-integer-8"
|
FCOMMON="$COMMON -frecursive -fdefault-integer-8 -cpp"
|
||||||
make -C serial64_ $TARGET USE_THREAD=0 USE_LOCKING=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblas64_" $AVX $LAPACKE INTERFACE64=1 SYMBOLSUFFIX=64_
|
make -C serial64_ $TARGET USE_THREAD=0 USE_LOCKING=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblas64_" $AVX $LAPACKE INTERFACE64=1 SYMBOLSUFFIX=64_
|
||||||
make -C threaded64_ $TARGET USE_THREAD=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblasp64_" $AVX $LAPACKE INTERFACE64=1 SYMBOLSUFFIX=64_
|
make -C threaded64_ $TARGET USE_THREAD=1 USE_OPENMP=0 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblasp64_" $AVX $LAPACKE INTERFACE64=1 SYMBOLSUFFIX=64_
|
||||||
|
|
||||||
COMMON="%{optflags} -fPIC -fopenmp -pthread"
|
COMMON="%{optflags} -fPIC -fopenmp -pthread"
|
||||||
FCOMMON="$COMMON -frecursive -fdefault-integer-8"
|
FCOMMON="$COMMON -frecursive -fdefault-integer-8 -cpp"
|
||||||
make -C openmp64_ $TARGET USE_THREAD=1 USE_OPENMP=1 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblaso64_" $AVX $LAPACKE INTERFACE64=1 SYMBOLSUFFIX=64_ CPP_THREAD_SAFETY_TEST=1
|
make -C openmp64_ $TARGET USE_THREAD=1 USE_OPENMP=1 FC=gfortran CC=gcc COMMON_OPT="$COMMON" FCOMMON_OPT="$FCOMMON" $NMAX LIBPREFIX="libopenblaso64_" $AVX $LAPACKE INTERFACE64=1 SYMBOLSUFFIX=64_
|
||||||
%endif
|
%endif
|
||||||
|
|
||||||
%install
|
%install
|
||||||
|
# Enable gcc-toolset-12
|
||||||
|
source scl_source enable gcc-toolset-12
|
||||||
|
|
||||||
rm -rf %{buildroot}
|
rm -rf %{buildroot}
|
||||||
# Install serial library and headers
|
# Install serial library and headers
|
||||||
make -C serial USE_THREAD=0 DESTDIR=%{buildroot} OPENBLAS_LIBRARY_DIR=%{_libdir} OPENBLAS_INCLUDE_DIR=%{_includedir}/%name OPENBLAS_BINARY_DIR=%{_bindir} OPENBLAS_CMAKE_DIR=%{_libdir}/cmake install
|
make -C serial USE_THREAD=0 DESTDIR=%{buildroot} OPENBLAS_LIBRARY_DIR=%{_libdir} OPENBLAS_INCLUDE_DIR=%{_includedir}/%name OPENBLAS_BINARY_DIR=%{_bindir} OPENBLAS_CMAKE_DIR=%{_libdir}/cmake install
|
||||||
@ -443,6 +455,9 @@ suffix=""
|
|||||||
%ifarch armv7hl
|
%ifarch armv7hl
|
||||||
suffix="_armv7"
|
suffix="_armv7"
|
||||||
%endif
|
%endif
|
||||||
|
%ifarch aarch64
|
||||||
|
suffix="_armv8"
|
||||||
|
%endif
|
||||||
slibname=`basename %{buildroot}%{_libdir}/libopenblas${suffix}-*.so .so`
|
slibname=`basename %{buildroot}%{_libdir}/libopenblas${suffix}-*.so .so`
|
||||||
mv %{buildroot}%{_libdir}/${slibname}.a %{buildroot}%{_libdir}/lib%{name}.a
|
mv %{buildroot}%{_libdir}/${slibname}.a %{buildroot}%{_libdir}/lib%{name}.a
|
||||||
if [[ "$suffix" != "" ]]; then
|
if [[ "$suffix" != "" ]]; then
|
||||||
@ -452,6 +467,10 @@ else
|
|||||||
sname=${slibname}
|
sname=${slibname}
|
||||||
fi
|
fi
|
||||||
|
|
||||||
|
# Install the Rblas library
|
||||||
|
mkdir -p %{buildroot}%{_libdir}/R/lib/
|
||||||
|
install -p -m 755 Rblas/libRblas.so %{buildroot}%{_libdir}/R/lib/
|
||||||
|
|
||||||
# Install the OpenMP library
|
# Install the OpenMP library
|
||||||
olibname=`echo ${slibname} | sed "s|lib%{name}|lib%{name}o|g"`
|
olibname=`echo ${slibname} | sed "s|lib%{name}|lib%{name}o|g"`
|
||||||
install -D -p -m 644 openmp/${olibname}.a %{buildroot}%{_libdir}/lib%{name}o.a
|
install -D -p -m 644 openmp/${olibname}.a %{buildroot}%{_libdir}/lib%{name}o.a
|
||||||
@ -555,33 +574,45 @@ ln -sf ${pname64_}.so lib%{name}p64_.so.0
|
|||||||
for lib in %{buildroot}%{_libdir}/libopenblas*.so; do
|
for lib in %{buildroot}%{_libdir}/libopenblas*.so; do
|
||||||
execstack -c $lib
|
execstack -c $lib
|
||||||
done
|
done
|
||||||
|
for lib in %{buildroot}%{_libdir}/R/lib/libRblas*.so; do
|
||||||
|
execstack -c $lib
|
||||||
|
done
|
||||||
%endif
|
%endif
|
||||||
|
|
||||||
# Get rid of generated CMake config
|
# Get rid of generated CMake config
|
||||||
rm -rf %{buildroot}%{_libdir}/cmake
|
rm -rf %{buildroot}%{_libdir}/cmake
|
||||||
|
|
||||||
%ldconfig_scriptlets
|
%post -p /sbin/ldconfig
|
||||||
|
%postun -p /sbin/ldconfig
|
||||||
|
|
||||||
%ldconfig_scriptlets openmp
|
%post openmp -p /sbin/ldconfig
|
||||||
|
%postun openmp -p /sbin/ldconfig
|
||||||
|
|
||||||
%ldconfig_scriptlets threads
|
%post Rblas -p /sbin/ldconfig
|
||||||
|
%postun Rblas -p /sbin/ldconfig
|
||||||
|
|
||||||
|
%post threads -p /sbin/ldconfig
|
||||||
|
%postun threads -p /sbin/ldconfig
|
||||||
|
|
||||||
%if %build64
|
%if %build64
|
||||||
%ldconfig_scriptlets openmp64
|
%post openmp64 -p /sbin/ldconfig
|
||||||
%ldconfig_scriptlets openmp64_
|
%postun openmp64 -p /sbin/ldconfig
|
||||||
|
%post openmp64_ -p /sbin/ldconfig
|
||||||
|
%postun openmp64_ -p /sbin/ldconfig
|
||||||
|
|
||||||
%ldconfig_scriptlets serial64
|
%post serial64 -p /sbin/ldconfig
|
||||||
%ldconfig_scriptlets serial64_
|
%postun serial64 -p /sbin/ldconfig
|
||||||
|
%post serial64_ -p /sbin/ldconfig
|
||||||
|
%postun serial64_ -p /sbin/ldconfig
|
||||||
|
|
||||||
%ldconfig_scriptlets threads64
|
%post threads64 -p /sbin/ldconfig
|
||||||
%ldconfig_scriptlets threads64_
|
%postun threads64 -p /sbin/ldconfig
|
||||||
|
%post threads64_ -p /sbin/ldconfig
|
||||||
|
%postun threads64_ -p /sbin/ldconfig
|
||||||
%endif
|
%endif
|
||||||
|
|
||||||
%files
|
%files
|
||||||
%license serial/LICENSE
|
%doc serial/Changelog.txt serial/GotoBLAS* serial/LICENSE
|
||||||
%doc serial/Changelog.txt serial/GotoBLAS*
|
|
||||||
|
|
||||||
%files serial
|
|
||||||
%{_libdir}/lib%{name}-*.so
|
%{_libdir}/lib%{name}-*.so
|
||||||
%{_libdir}/lib%{name}.so.*
|
%{_libdir}/lib%{name}.so.*
|
||||||
|
|
||||||
@ -635,6 +666,9 @@ rm -rf %{buildroot}%{_libdir}/cmake
|
|||||||
%{_libdir}/lib%{name}p64_.so
|
%{_libdir}/lib%{name}p64_.so
|
||||||
%endif
|
%endif
|
||||||
|
|
||||||
|
%files Rblas
|
||||||
|
%{_libdir}/R/lib/libRblas.so
|
||||||
|
|
||||||
%files static
|
%files static
|
||||||
%{_libdir}/lib%{name}.a
|
%{_libdir}/lib%{name}.a
|
||||||
%{_libdir}/lib%{name}o.a
|
%{_libdir}/lib%{name}o.a
|
||||||
@ -649,163 +683,94 @@ rm -rf %{buildroot}%{_libdir}/cmake
|
|||||||
%endif
|
%endif
|
||||||
|
|
||||||
%changelog
|
%changelog
|
||||||
* Thu Aug 22 2024 Pavel Simovec <psimovec@redhat.com> - 0.3.26-2
|
* Thu Feb 16 2023 Matej Mužila <mmuzila@redhat.com> - 0.3.15-6
|
||||||
- Re-include openblas.pc
|
|
||||||
- Resolves: RHEL-20160
|
|
||||||
|
|
||||||
* Thu Jun 27 2024 Pavel Simovec <psimovec@redhat.com> - 0.3.26-1
|
|
||||||
- Update to 0.3.26
|
|
||||||
- Resolves: RHEL-20160
|
|
||||||
|
|
||||||
* Tue Jan 31 2023 Matej Mužila <mmuzila@redhat.com> - 0.3.21-2
|
|
||||||
- Include openblas.pc
|
- Include openblas.pc
|
||||||
Resolves: #2115737
|
- Resolves: #2115722
|
||||||
|
|
||||||
* Wed Aug 24 2022 Honza Horak <hhorak@redhat.com> - 0.3.21-1
|
* Wed Feb 15 2023 Nikola Forró <nforro@redhat.com> - 0.3.15-5
|
||||||
- Update to 0.3.21
|
- Disable dynamic CPU detection on aarch64
|
||||||
Resolves: #2112099
|
- Use gcc-toolset-12
|
||||||
- Fix SBGEMM test to work with INTERFACE64 (rhbz#2120974)
|
- Resolves: #2170398
|
||||||
|
|
||||||
* Tue Jan 11 2022 Honza Horak <hhorak@redhat.com> - 0.3.15-3
|
* Wed Jun 15 2022 Matej Mužila <mmuzila@redhat.com> - 0.3.15-4
|
||||||
- Fix out of bounds read in ?llarv (Reference-LAPACK PR 625)
|
- Fix out-of-bounds read in *larrv
|
||||||
(CVE-2021-4048)
|
- Resolves: CVE-2021-4048
|
||||||
Resolves: #2029855
|
|
||||||
|
|
||||||
* Mon Aug 09 2021 Mohan Boddu <mboddu@redhat.com> - 0.3.15-2
|
* Fri Nov 12 2021 Nikola Forró <nforro@redhat.com> - 0.3.15-3
|
||||||
- Rebuilt for IMA sigs, glibc 2.34, aarch64 flags
|
- Fix missing header files in openblas-devel subpackage by enabling
|
||||||
Related: rhbz#1991688
|
gcc-toolset-11 in %%install as well
|
||||||
|
related: #1983218
|
||||||
|
|
||||||
* Thu May 06 2021 Nikola Forró <nforro@redhat.com> - 0.3.15-1
|
* Thu Oct 21 2021 Nikola Forró <nforro@redhat.com> - 0.3.15-2
|
||||||
- Update to 0.3.15.
|
- Enable dynamic cpu detection on all supported architectures
|
||||||
related: #1870676
|
related: #1983218
|
||||||
related: #1870033
|
|
||||||
|
|
||||||
* Fri Apr 16 2021 Mohan Boddu <mboddu@redhat.com> - 0.3.13-2
|
* Wed Sep 15 2021 Nikola Forró <nforro@redhat.com> - 0.3.15-1
|
||||||
- Rebuilt for RHEL 9 BETA on Apr 15th 2021. Related: rhbz#1947937
|
- Rebase to version 0.3.15
|
||||||
|
- Use gcc-toolset-11 to benefit from POWER 10 optimizations
|
||||||
|
resolves: #1983218
|
||||||
|
|
||||||
* Tue Apr 06 2021 Nikola Forró <nforro@redhat.com> - 0.3.13-1
|
* Wed Oct 28 2020 Nikola Forró <nforro@redhat.com> - 0.3.12-1
|
||||||
- Update to 0.3.13.
|
- Rebase to version 0.3.12
|
||||||
resolves: #1870676
|
related: #1847435
|
||||||
related: #1870033
|
|
||||||
|
|
||||||
* Tue Jan 26 2021 Fedora Release Engineering <releng@fedoraproject.org> - 0.3.12-2
|
* Wed Oct 21 2020 Nikola Forró <nforro@redhat.com> - 0.3.10-2
|
||||||
- Rebuilt for https://fedoraproject.org/wiki/Fedora_34_Mass_Rebuild
|
- Fix macro used in LAPACKE_zgesvdq
|
||||||
|
related: #1847435
|
||||||
|
|
||||||
* Sun Oct 25 2020 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.12-1
|
* Tue Oct 20 2020 Nikola Forró <nforro@redhat.com> - 0.3.10-1
|
||||||
- Update to 0.3.12.
|
- Rebase to version 0.3.10
|
||||||
|
resolves: #1847435
|
||||||
|
|
||||||
* Sun Oct 18 2020 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.11-1
|
* Fri Nov 22 2019 Nikola Forró <nforro@redhat.com> - 0.3.3-5
|
||||||
- Update to 0.3.11.
|
- Detect POWER9 as POWER8
|
||||||
|
related: #1752241
|
||||||
|
|
||||||
* Fri Sep 18 2020 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.10-6
|
* Wed Nov 20 2019 Nikola Forró <nforro@redhat.com> - 0.3.3-4
|
||||||
- Fix incorrect result of cblas_zdotc_sub on ppc64le (BZ #1878449).
|
- Add tests and enable gating
|
||||||
|
related: #1752241
|
||||||
|
|
||||||
* Sat Aug 29 2020 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.10-5
|
* Tue Sep 24 2019 Nikola Forró <nforro@redhat.com> - 0.3.3-3
|
||||||
- Fix unresolved bfloat16 datatype (BZ #1873667).
|
- Fix izamax on s390x
|
||||||
|
resolves: #1752241
|
||||||
|
|
||||||
* Fri Aug 14 2020 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.10-4
|
* Wed Nov 07 2018 Nikola Forró <nforro@redhat.com> - 0.3.3-2
|
||||||
- Obsolete Rblas package (BZ #1849966).
|
- Fix i686-x86_64 multilib difference
|
||||||
|
related: #1627890
|
||||||
|
|
||||||
* Tue Aug 11 2020 Jeff Law <law@redhat.com> - 0.3.10-3
|
* Fri Oct 19 2018 Nikola Forró <nforro@redhat.com> - 0.3.3-1
|
||||||
- Disable LTO
|
- Rebase to version 0.3.3
|
||||||
|
resolves: #1627890
|
||||||
|
|
||||||
* Tue Jul 28 2020 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.10-2
|
* Mon Oct 15 2018 Nikola Forró <nforro@redhat.com> - 0.2.20-16
|
||||||
- Include upstream patch 2672 to fix test suite on systems with few CPUs.
|
- Set proper CFLAGS also for Rblas
|
||||||
|
related: #1624156
|
||||||
|
|
||||||
* Mon Jun 15 2020 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.10-1
|
* Fri Oct 12 2018 Nikola Forró <nforro@redhat.com> - 0.2.20-15
|
||||||
- Update to 0.3.10.
|
- Remove optimization pragmas on ppc64le
|
||||||
|
related: #1624156
|
||||||
|
|
||||||
* Thu May 28 2020 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.9-3
|
* Wed Sep 26 2018 Nikola Forró <nforro@redhat.com> - 0.2.20-14
|
||||||
- Enable USE_LOCKING in the sequential versions of the library for
|
- Ensure object files built from assembler sources are annotated
|
||||||
thread safety.
|
related: #1624156
|
||||||
|
|
||||||
* Thu Apr 02 2020 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.9-2
|
* Mon Sep 17 2018 Nikola Forró <nforro@redhat.com> - 0.2.20-13
|
||||||
- Patch for BZ #1820131.
|
- Fix detection of generic ARMv8 CPUs
|
||||||
|
- Get rid of executable stack in libRblas.so
|
||||||
|
related: #1624156
|
||||||
|
|
||||||
* Mon Mar 02 2020 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.9-1
|
* Thu Sep 06 2018 Nikola Forró <nforro@redhat.com> - 0.2.20-12
|
||||||
- Update to 0.3.9.
|
- Force preprocessing of Fortran sources to make annobin record proper flags
|
||||||
|
- Enable optimizations for all LAPACK sources
|
||||||
|
resolves: #1624156
|
||||||
|
|
||||||
* Tue Feb 11 2020 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.8-1
|
* Tue Aug 14 2018 Nikola Forró <nforro@redhat.com> - 0.2.20-11
|
||||||
- Update to 0.3.8; dynamic runtime cpu detection on all architectures.
|
- Fix build on s390x (#1615557)
|
||||||
- Also updates bundled LAPACK to 3.9.0.
|
|
||||||
|
|
||||||
* Wed Jan 29 2020 Fedora Release Engineering <releng@fedoraproject.org> - 0.3.7-3
|
|
||||||
- Rebuilt for https://fedoraproject.org/wiki/Fedora_32_Mass_Rebuild
|
|
||||||
|
|
||||||
* Wed Dec 11 2019 Dominik Mierzejewski <rpm@greysector.net> - 0.3.7-2
|
|
||||||
- enable C++ thread safety test where possible
|
|
||||||
|
|
||||||
* Mon Aug 12 2019 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.7-1
|
|
||||||
- Update to 0.3.7.
|
|
||||||
|
|
||||||
* Thu Jul 25 2019 Fedora Release Engineering <releng@fedoraproject.org> - 0.3.6-3
|
|
||||||
- Rebuilt for https://fedoraproject.org/wiki/Fedora_31_Mass_Rebuild
|
|
||||||
|
|
||||||
* Tue Jul 02 2019 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.6-2
|
|
||||||
- Rebuild since older build doesn't show up in updates system.
|
|
||||||
|
|
||||||
* Tue Apr 30 2019 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.6-1
|
|
||||||
- Update to 0.3.6.
|
|
||||||
|
|
||||||
* Tue Feb 26 2019 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.5-5
|
|
||||||
- Even more assembly kernel patches.
|
|
||||||
|
|
||||||
* Mon Feb 25 2019 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.5-4
|
|
||||||
- Another assembly kernel patch.
|
|
||||||
|
|
||||||
* Sun Feb 17 2019 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.5-3
|
|
||||||
- Patch assembly kernels to satisfy gcc 9 demands.
|
|
||||||
|
|
||||||
* Fri Feb 01 2019 Fedora Release Engineering <releng@fedoraproject.org> - 0.3.5-2
|
|
||||||
- Rebuilt for https://fedoraproject.org/wiki/Fedora_30_Mass_Rebuild
|
|
||||||
|
|
||||||
* Mon Jan 07 2019 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.5-1
|
|
||||||
- Update to 0.3.5, with dynamic CPU detection on aarch64.
|
|
||||||
|
|
||||||
* Fri Nov 09 2018 Nikola Forró <nforro@redhat.com> - 0.3.3-3
|
|
||||||
- Fix i686-x86_64 multilib difference.
|
|
||||||
- Get rid of executable stack in libRblas.so.
|
|
||||||
|
|
||||||
* Sat Sep 29 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.3-2
|
|
||||||
- Fix segfault (BZ #1634060).
|
|
||||||
|
|
||||||
* Sun Sep 09 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.3-1
|
|
||||||
- Update to 0.3.3.
|
|
||||||
|
|
||||||
* Wed Aug 29 2018 Dan Horák <dan[at]danny.cz> - 0.3.2-5
|
|
||||||
- Fix precision in generic target on s390x
|
|
||||||
|
|
||||||
* Fri Aug 24 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.2-4
|
|
||||||
- Patch to avoid threading issues.
|
|
||||||
|
|
||||||
* Fri Aug 24 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.2-3
|
|
||||||
- Add missing %%{optflags} to COMMON (see discussion in #1619074).
|
|
||||||
|
|
||||||
* Wed Aug 15 2018 Dan Horák <dan[at]danny.cz> - 0.3.2-2
|
|
||||||
- Explicitly set the target to generic on s390x to avoid surprises (#1615760)
|
|
||||||
|
|
||||||
* Thu Aug 02 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.2-1
|
|
||||||
- Update to 0.3.2.
|
|
||||||
|
|
||||||
* Sun Jul 22 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.1-3
|
|
||||||
- Fix crash with multiple instances (BZ #1605231).
|
|
||||||
|
|
||||||
* Fri Jul 13 2018 Fedora Release Engineering <releng@fedoraproject.org> - 0.3.1-2
|
|
||||||
- Rebuilt for https://fedoraproject.org/wiki/Fedora_29_Mass_Rebuild
|
|
||||||
|
|
||||||
* Sun Jul 01 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.1-1
|
|
||||||
- Update to 0.3.1.
|
|
||||||
|
|
||||||
* Mon Jun 11 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.0-2
|
|
||||||
- Split sequential libraries from core package to openblas-serial.
|
|
||||||
|
|
||||||
* Thu May 24 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.3.0-1
|
|
||||||
- Update to 0.3.0.
|
|
||||||
|
|
||||||
* Thu Mar 22 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.2.20-10
|
* Thu Mar 22 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.2.20-10
|
||||||
- Disable CPU affinity unintentionally enabled upstream (BZ #1558091).
|
- Disable CPU affinity unintentionally enabled upstream (BZ #1558091).
|
||||||
|
|
||||||
* Sun Mar 04 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.2.20-9
|
* Wed Mar 04 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.2.20-9
|
||||||
- Clean up obsolete conditionals for 64 bit builds in spec file.
|
- Clean up obsolete conditionals for 64 bit builds in spec file.
|
||||||
|
|
||||||
* Tue Feb 27 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.2.20-8
|
* Tue Feb 27 2018 Susi Lehtola <jussilehtola@fedoraproject.org> - 0.2.20-8
|
@ -1,6 +0,0 @@
|
|||||||
--- !Policy
|
|
||||||
product_versions:
|
|
||||||
- rhel-9
|
|
||||||
decision_context: osci_compose_gate
|
|
||||||
rules:
|
|
||||||
- !PassingTestCaseRule {test_case_name: osci.brew-build.tier0.functional}
|
|
@ -1,19 +0,0 @@
|
|||||||
diff -up OpenBLAS-0.2.15/driver/others/memory.c.priority OpenBLAS-0.2.15/driver/others/memory.c
|
|
||||||
--- OpenBLAS-0.2.15/driver/others/memory.c.priority 2015-10-27 21:44:50.000000000 +0100
|
|
||||||
+++ OpenBLAS-0.2.15/driver/others/memory.c 2016-01-13 21:12:01.862225898 +0100
|
|
||||||
@@ -146,8 +146,15 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF
|
|
||||||
#define CONSTRUCTOR __attribute__ ((constructor))
|
|
||||||
#define DESTRUCTOR __attribute__ ((destructor))
|
|
||||||
#else
|
|
||||||
+#if __GNUC__ && INIT_PRIORITY && ((GCC_VERSION >= 40300) || (CLANG_VERSION >= 20900))
|
|
||||||
#define CONSTRUCTOR __attribute__ ((constructor(101)))
|
|
||||||
#define DESTRUCTOR __attribute__ ((destructor(101)))
|
|
||||||
+#elif __GNUC__ && INIT_PRIORITY
|
|
||||||
+#define CONSTRUCTOR __attribute__ ((constructor))
|
|
||||||
+#define DESTRUCTOR __attribute__ ((destructor))
|
|
||||||
+#else
|
|
||||||
+#define CONSTRUCTOR
|
|
||||||
+#define DESTRUCTOR
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#ifdef DYNAMIC_ARCH
|
|
@ -1,752 +0,0 @@
|
|||||||
This is a compilation of more upstream commits related to:
|
|
||||||
https://github.com/OpenMathLib/OpenBLAS/issues/4475
|
|
||||||
|
|
||||||
|
|
||||||
From 63004fa5f76ef1058975271314bc4591e7878726 Mon Sep 17 00:00:00 2001
|
|
||||||
From: Honza Horak <hhorak@redhat.com>
|
|
||||||
Date: Fri, 9 Feb 2024 09:49:41 +0100
|
|
||||||
Subject: [PATCH 1/6] Fix incompatible pointer type in BFLOAT16 mode
|
|
||||||
|
|
||||||
Upstream commit:
|
|
||||||
|
|
||||||
commit 68d354814f9f846338e1988c4f609c8add419012
|
|
||||||
Author: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de>
|
|
||||||
Date: Sun Feb 4 01:14:22 2024 +0100
|
|
||||||
|
|
||||||
Fix incompatible pointer type in BFLOAT16 mode
|
|
||||||
---
|
|
||||||
interface/gemmt.c | 4 ++--
|
|
||||||
1 file changed, 2 insertions(+), 2 deletions(-)
|
|
||||||
|
|
||||||
diff --git a/interface/gemmt.c b/interface/gemmt.c
|
|
||||||
index 046432670..2fb9954ad 100644
|
|
||||||
--- a/interface/gemmt.c
|
|
||||||
+++ b/interface/gemmt.c
|
|
||||||
@@ -478,7 +478,7 @@ void CNAME(enum CBLAS_ORDER order, enum CBLAS_UPLO Uplo,
|
|
||||||
#endif
|
|
||||||
// for alignment
|
|
||||||
buffer_size = (buffer_size + 3) & ~3;
|
|
||||||
- STACK_ALLOC(buffer_size, FLOAT, buffer);
|
|
||||||
+ STACK_ALLOC(buffer_size, IFLOAT, buffer);
|
|
||||||
|
|
||||||
#ifdef SMP
|
|
||||||
|
|
||||||
@@ -567,7 +567,7 @@ void CNAME(enum CBLAS_ORDER order, enum CBLAS_UPLO Uplo,
|
|
||||||
#endif
|
|
||||||
// for alignment
|
|
||||||
buffer_size = (buffer_size + 3) & ~3;
|
|
||||||
- STACK_ALLOC(buffer_size, FLOAT, buffer);
|
|
||||||
+ STACK_ALLOC(buffer_size, IFLOAT, buffer);
|
|
||||||
|
|
||||||
#ifdef SMP
|
|
||||||
|
|
||||||
--
|
|
||||||
2.41.0
|
|
||||||
|
|
||||||
From edfd4f52f3f22344863c233411ae792fb12aa81b Mon Sep 17 00:00:00 2001
|
|
||||||
From: Honza Horak <hhorak@redhat.com>
|
|
||||||
Date: Fri, 9 Feb 2024 09:53:40 +0100
|
|
||||||
Subject: [PATCH 2/6] Separate the interface for SBGEMMT from GEMMT due to
|
|
||||||
differences in GEMV arguments
|
|
||||||
|
|
||||||
Upstream commit:
|
|
||||||
|
|
||||||
commit d4db6a9f16a5c82bbe1860f591cc731c4d83d7c8
|
|
||||||
Author: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de>
|
|
||||||
Date: Tue Feb 6 22:23:47 2024 +0100
|
|
||||||
|
|
||||||
Separate the interface for SBGEMMT from GEMMT due to differences in GEMV arguments
|
|
||||||
---
|
|
||||||
interface/CMakeLists.txt | 1 +
|
|
||||||
interface/Makefile | 4 +-
|
|
||||||
interface/sbgemmt.c | 447 +++++++++++++++++++++++++++++++++++++++
|
|
||||||
3 files changed, 450 insertions(+), 2 deletions(-)
|
|
||||||
create mode 100644 interface/sbgemmt.c
|
|
||||||
|
|
||||||
diff --git a/interface/CMakeLists.txt b/interface/CMakeLists.txt
|
|
||||||
index 4e082928b..3110f2e90 100644
|
|
||||||
--- a/interface/CMakeLists.txt
|
|
||||||
+++ b/interface/CMakeLists.txt
|
|
||||||
@@ -119,6 +119,7 @@ endif ()
|
|
||||||
if (BUILD_BFLOAT16)
|
|
||||||
GenerateNamedObjects("bf16dot.c" "" "sbdot" ${CBLAS_FLAG} "" "" true "BFLOAT16")
|
|
||||||
GenerateNamedObjects("gemm.c" "" "sbgemm" ${CBLAS_FLAG} "" "" true "BFLOAT16")
|
|
||||||
+ GenerateNamedObjects("gemmt.c" "" "sbgemmt" ${CBLAS_FLAG} "" "" true "BFLOAT16")
|
|
||||||
GenerateNamedObjects("sbgemv.c" "" "sbgemv" ${CBLAS_FLAG} "" "" true "BFLOAT16")
|
|
||||||
GenerateNamedObjects("tobf16.c" "SINGLE_PREC" "sbstobf16" ${CBLAS_FLAG} "" "" true "BFLOAT16")
|
|
||||||
GenerateNamedObjects("tobf16.c" "DOUBLE_PREC" "sbdtobf16" ${CBLAS_FLAG} "" "" true "BFLOAT16")
|
|
||||||
diff --git a/interface/Makefile b/interface/Makefile
|
|
||||||
index 78335357b..d106ca568 100644
|
|
||||||
--- a/interface/Makefile
|
|
||||||
+++ b/interface/Makefile
|
|
||||||
@@ -1301,7 +1301,7 @@ xhpr2.$(SUFFIX) xhpr2.$(PSUFFIX) : zhpr2.c
|
|
||||||
ifeq ($(BUILD_BFLOAT16),1)
|
|
||||||
sbgemm.$(SUFFIX) sbgemm.$(PSUFFIX) : gemm.c ../param.h
|
|
||||||
$(CC) -c $(CFLAGS) $< -o $(@F)
|
|
||||||
-sbgemmt.$(SUFFIX) sbgemmt.$(PSUFFIX) : gemmt.c ../param.h
|
|
||||||
+sbgemmt.$(SUFFIX) sbgemmt.$(PSUFFIX) : sbgemmt.c ../param.h
|
|
||||||
$(CC) -c $(CFLAGS) $< -o $(@F)
|
|
||||||
endif
|
|
||||||
|
|
||||||
@@ -1932,7 +1932,7 @@ cblas_sgemmt.$(SUFFIX) cblas_sgemmt.$(PSUFFIX) : gemmt.c ../param.h
|
|
||||||
$(CC) -DCBLAS -c $(CFLAGS) $< -o $(@F)
|
|
||||||
|
|
||||||
ifeq ($(BUILD_BFLOAT16),1)
|
|
||||||
-cblas_sbgemmt.$(SUFFIX) cblas_sbgemmt.$(PSUFFIX) : gemmt.c ../param.h
|
|
||||||
+cblas_sbgemmt.$(SUFFIX) cblas_sbgemmt.$(PSUFFIX) : sbgemmt.c ../param.h
|
|
||||||
$(CC) -DCBLAS -c $(CFLAGS) $< -o $(@F)
|
|
||||||
endif
|
|
||||||
|
|
||||||
diff --git a/interface/sbgemmt.c b/interface/sbgemmt.c
|
|
||||||
new file mode 100644
|
|
||||||
index 000000000..759af4bfb
|
|
||||||
--- /dev/null
|
|
||||||
+++ b/interface/sbgemmt.c
|
|
||||||
@@ -0,0 +1,447 @@
|
|
||||||
+/*********************************************************************/
|
|
||||||
+/* Copyright 2024, The OpenBLAS Project. */
|
|
||||||
+/* All rights reserved. */
|
|
||||||
+/* */
|
|
||||||
+/* Redistribution and use in source and binary forms, with or */
|
|
||||||
+/* without modification, are permitted provided that the following */
|
|
||||||
+/* conditions are met: */
|
|
||||||
+/* */
|
|
||||||
+/* 1. Redistributions of source code must retain the above */
|
|
||||||
+/* copyright notice, this list of conditions and the following */
|
|
||||||
+/* disclaimer. */
|
|
||||||
+/* */
|
|
||||||
+/* 2. Redistributions in binary form must reproduce the above */
|
|
||||||
+/* copyright notice, this list of conditions and the following */
|
|
||||||
+/* disclaimer in the documentation and/or other materials */
|
|
||||||
+/* provided with the distribution. */
|
|
||||||
+/* */
|
|
||||||
+/* THIS SOFTWARE IS PROVIDED BY THE UNIVERSITY OF TEXAS AT */
|
|
||||||
+/* AUSTIN ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, */
|
|
||||||
+/* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF */
|
|
||||||
+/* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE */
|
|
||||||
+/* DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY OF TEXAS AT */
|
|
||||||
+/* AUSTIN OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, */
|
|
||||||
+/* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES */
|
|
||||||
+/* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE */
|
|
||||||
+/* GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR */
|
|
||||||
+/* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF */
|
|
||||||
+/* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT */
|
|
||||||
+/* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT */
|
|
||||||
+/* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE */
|
|
||||||
+/* POSSIBILITY OF SUCH DAMAGE. */
|
|
||||||
+/* */
|
|
||||||
+/*********************************************************************/
|
|
||||||
+
|
|
||||||
+#include <stdio.h>
|
|
||||||
+#include <stdlib.h>
|
|
||||||
+#include "common.h"
|
|
||||||
+
|
|
||||||
+#define SMP_THRESHOLD_MIN 65536.0
|
|
||||||
+#define ERROR_NAME "SBGEMMT "
|
|
||||||
+
|
|
||||||
+#ifndef GEMM_MULTITHREAD_THRESHOLD
|
|
||||||
+#define GEMM_MULTITHREAD_THRESHOLD 4
|
|
||||||
+#endif
|
|
||||||
+
|
|
||||||
+#ifndef CBLAS
|
|
||||||
+
|
|
||||||
+void NAME(char *UPLO, char *TRANSA, char *TRANSB,
|
|
||||||
+ blasint * M, blasint * K,
|
|
||||||
+ FLOAT * Alpha,
|
|
||||||
+ IFLOAT * a, blasint * ldA,
|
|
||||||
+ IFLOAT * b, blasint * ldB, FLOAT * Beta, FLOAT * c, blasint * ldC)
|
|
||||||
+{
|
|
||||||
+
|
|
||||||
+ blasint m, k;
|
|
||||||
+ blasint lda, ldb, ldc;
|
|
||||||
+ int transa, transb, uplo;
|
|
||||||
+ blasint info;
|
|
||||||
+
|
|
||||||
+ char transA, transB, Uplo;
|
|
||||||
+ blasint nrowa, nrowb;
|
|
||||||
+ IFLOAT *buffer;
|
|
||||||
+ IFLOAT *aa, *bb;
|
|
||||||
+ FLOAT *cc;
|
|
||||||
+ FLOAT alpha, beta;
|
|
||||||
+
|
|
||||||
+ PRINT_DEBUG_NAME;
|
|
||||||
+
|
|
||||||
+ m = *M;
|
|
||||||
+ k = *K;
|
|
||||||
+
|
|
||||||
+ alpha = *Alpha;
|
|
||||||
+ beta = *Beta;
|
|
||||||
+
|
|
||||||
+ lda = *ldA;
|
|
||||||
+ ldb = *ldB;
|
|
||||||
+ ldc = *ldC;
|
|
||||||
+
|
|
||||||
+ transA = *TRANSA;
|
|
||||||
+ transB = *TRANSB;
|
|
||||||
+ Uplo = *UPLO;
|
|
||||||
+ TOUPPER(transA);
|
|
||||||
+ TOUPPER(transB);
|
|
||||||
+ TOUPPER(Uplo);
|
|
||||||
+
|
|
||||||
+ transa = -1;
|
|
||||||
+ transb = -1;
|
|
||||||
+ uplo = -1;
|
|
||||||
+
|
|
||||||
+ if (transA == 'N')
|
|
||||||
+ transa = 0;
|
|
||||||
+ if (transA == 'T')
|
|
||||||
+ transa = 1;
|
|
||||||
+
|
|
||||||
+ if (transA == 'R')
|
|
||||||
+ transa = 0;
|
|
||||||
+ if (transA == 'C')
|
|
||||||
+ transa = 1;
|
|
||||||
+
|
|
||||||
+ if (transB == 'N')
|
|
||||||
+ transb = 0;
|
|
||||||
+ if (transB == 'T')
|
|
||||||
+ transb = 1;
|
|
||||||
+
|
|
||||||
+ if (transB == 'R')
|
|
||||||
+ transb = 0;
|
|
||||||
+ if (transB == 'C')
|
|
||||||
+ transb = 1;
|
|
||||||
+
|
|
||||||
+ if (Uplo == 'U')
|
|
||||||
+ uplo = 0;
|
|
||||||
+ if (Uplo == 'L')
|
|
||||||
+ uplo = 1;
|
|
||||||
+ nrowa = m;
|
|
||||||
+ if (transa & 1) nrowa = k;
|
|
||||||
+ nrowb = k;
|
|
||||||
+ if (transb & 1) nrowb = m;
|
|
||||||
+
|
|
||||||
+ info = 0;
|
|
||||||
+
|
|
||||||
+ if (ldc < MAX(1, m))
|
|
||||||
+ info = 13;
|
|
||||||
+ if (ldb < MAX(1, nrowb))
|
|
||||||
+ info = 10;
|
|
||||||
+ if (lda < MAX(1, nrowa))
|
|
||||||
+ info = 8;
|
|
||||||
+ if (k < 0)
|
|
||||||
+ info = 5;
|
|
||||||
+ if (m < 0)
|
|
||||||
+ info = 4;
|
|
||||||
+ if (transb < 0)
|
|
||||||
+ info = 3;
|
|
||||||
+ if (transa < 0)
|
|
||||||
+ info = 2;
|
|
||||||
+ if (uplo < 0)
|
|
||||||
+ info = 1;
|
|
||||||
+
|
|
||||||
+ if (info != 0) {
|
|
||||||
+ BLASFUNC(xerbla) (ERROR_NAME, &info, sizeof(ERROR_NAME));
|
|
||||||
+ return;
|
|
||||||
+ }
|
|
||||||
+#else
|
|
||||||
+
|
|
||||||
+void CNAME(enum CBLAS_ORDER order, enum CBLAS_UPLO Uplo,
|
|
||||||
+ enum CBLAS_TRANSPOSE TransA, enum CBLAS_TRANSPOSE TransB, blasint m,
|
|
||||||
+ blasint k,
|
|
||||||
+ FLOAT alpha,
|
|
||||||
+ IFLOAT * A, blasint LDA,
|
|
||||||
+ IFLOAT * B, blasint LDB, FLOAT beta, FLOAT * c, blasint ldc)
|
|
||||||
+{
|
|
||||||
+ IFLOAT *aa, *bb;
|
|
||||||
+ FLOAT *cc;
|
|
||||||
+
|
|
||||||
+ int transa, transb, uplo;
|
|
||||||
+ blasint info;
|
|
||||||
+ blasint lda, ldb;
|
|
||||||
+ IFLOAT *a, *b;
|
|
||||||
+ XFLOAT *buffer;
|
|
||||||
+
|
|
||||||
+ PRINT_DEBUG_CNAME;
|
|
||||||
+
|
|
||||||
+ uplo = -1;
|
|
||||||
+ transa = -1;
|
|
||||||
+ transb = -1;
|
|
||||||
+ info = 0;
|
|
||||||
+
|
|
||||||
+ if (order == CblasColMajor) {
|
|
||||||
+ if (Uplo == CblasUpper) uplo = 0;
|
|
||||||
+ if (Uplo == CblasLower) uplo = 1;
|
|
||||||
+
|
|
||||||
+ if (TransA == CblasNoTrans)
|
|
||||||
+ transa = 0;
|
|
||||||
+ if (TransA == CblasTrans)
|
|
||||||
+ transa = 1;
|
|
||||||
+
|
|
||||||
+ if (TransA == CblasConjNoTrans)
|
|
||||||
+ transa = 0;
|
|
||||||
+ if (TransA == CblasConjTrans)
|
|
||||||
+ transa = 1;
|
|
||||||
+
|
|
||||||
+ if (TransB == CblasNoTrans)
|
|
||||||
+ transb = 0;
|
|
||||||
+ if (TransB == CblasTrans)
|
|
||||||
+ transb = 1;
|
|
||||||
+
|
|
||||||
+ if (TransB == CblasConjNoTrans)
|
|
||||||
+ transb = 0;
|
|
||||||
+ if (TransB == CblasConjTrans)
|
|
||||||
+ transb = 1;
|
|
||||||
+
|
|
||||||
+ a = (void *)A;
|
|
||||||
+ b = (void *)B;
|
|
||||||
+ lda = LDA;
|
|
||||||
+ ldb = LDB;
|
|
||||||
+
|
|
||||||
+ info = -1;
|
|
||||||
+
|
|
||||||
+ blasint nrowa;
|
|
||||||
+ blasint nrowb;
|
|
||||||
+ nrowa = m;
|
|
||||||
+ if (transa & 1) nrowa = k;
|
|
||||||
+ nrowb = k;
|
|
||||||
+ if (transb & 1) nrowb = m;
|
|
||||||
+
|
|
||||||
+ if (ldc < MAX(1, m))
|
|
||||||
+ info = 13;
|
|
||||||
+ if (ldb < MAX(1, nrowb))
|
|
||||||
+ info = 10;
|
|
||||||
+ if (lda < MAX(1, nrowa))
|
|
||||||
+ info = 8;
|
|
||||||
+ if (k < 0)
|
|
||||||
+ info = 5;
|
|
||||||
+ if (m < 0)
|
|
||||||
+ info = 4;
|
|
||||||
+ if (transb < 0)
|
|
||||||
+ info = 3;
|
|
||||||
+ if (transa < 0)
|
|
||||||
+ info = 2;
|
|
||||||
+ if (uplo < 0)
|
|
||||||
+ info = 1;
|
|
||||||
+ }
|
|
||||||
+
|
|
||||||
+ if (order == CblasRowMajor) {
|
|
||||||
+
|
|
||||||
+ a = (void *)B;
|
|
||||||
+ b = (void *)A;
|
|
||||||
+
|
|
||||||
+ lda = LDB;
|
|
||||||
+ ldb = LDA;
|
|
||||||
+
|
|
||||||
+ if (Uplo == CblasUpper) uplo = 0;
|
|
||||||
+ if (Uplo == CblasLower) uplo = 1;
|
|
||||||
+
|
|
||||||
+ if (TransB == CblasNoTrans)
|
|
||||||
+ transa = 0;
|
|
||||||
+ if (TransB == CblasTrans)
|
|
||||||
+ transa = 1;
|
|
||||||
+
|
|
||||||
+ if (TransB == CblasConjNoTrans)
|
|
||||||
+ transa = 0;
|
|
||||||
+ if (TransB == CblasConjTrans)
|
|
||||||
+ transa = 1;
|
|
||||||
+
|
|
||||||
+ if (TransA == CblasNoTrans)
|
|
||||||
+ transb = 0;
|
|
||||||
+ if (TransA == CblasTrans)
|
|
||||||
+ transb = 1;
|
|
||||||
+
|
|
||||||
+ if (TransA == CblasConjNoTrans)
|
|
||||||
+ transb = 0;
|
|
||||||
+ if (TransA == CblasConjTrans)
|
|
||||||
+ transb = 1;
|
|
||||||
+
|
|
||||||
+ info = -1;
|
|
||||||
+
|
|
||||||
+ blasint ncola;
|
|
||||||
+ blasint ncolb;
|
|
||||||
+
|
|
||||||
+ ncola = m;
|
|
||||||
+ if (transa & 1) ncola = k;
|
|
||||||
+ ncolb = k;
|
|
||||||
+
|
|
||||||
+ if (transb & 1) {
|
|
||||||
+ ncolb = m;
|
|
||||||
+ }
|
|
||||||
+
|
|
||||||
+ if (ldc < MAX(1,m))
|
|
||||||
+ info = 13;
|
|
||||||
+ if (ldb < MAX(1, ncolb))
|
|
||||||
+ info = 8;
|
|
||||||
+ if (lda < MAX(1, ncola))
|
|
||||||
+ info = 10;
|
|
||||||
+ if (k < 0)
|
|
||||||
+ info = 5;
|
|
||||||
+ if (m < 0)
|
|
||||||
+ info = 4;
|
|
||||||
+ if (transb < 0)
|
|
||||||
+ info = 2;
|
|
||||||
+ if (transa < 0)
|
|
||||||
+ info = 3;
|
|
||||||
+ if (uplo < 0)
|
|
||||||
+ info = 1;
|
|
||||||
+ }
|
|
||||||
+
|
|
||||||
+ if (info >= 0) {
|
|
||||||
+ BLASFUNC(xerbla) (ERROR_NAME, &info, sizeof(ERROR_NAME));
|
|
||||||
+ return;
|
|
||||||
+ }
|
|
||||||
+
|
|
||||||
+#endif
|
|
||||||
+ int buffer_size;
|
|
||||||
+ blasint i, j;
|
|
||||||
+
|
|
||||||
+#ifdef SMP
|
|
||||||
+ int nthreads;
|
|
||||||
+#endif
|
|
||||||
+
|
|
||||||
+
|
|
||||||
+#ifdef SMP
|
|
||||||
+ static int (*gemv_thread[]) (BLASLONG, BLASLONG, FLOAT, IFLOAT *,
|
|
||||||
+ BLASLONG, IFLOAT *, BLASLONG, FLOAT,
|
|
||||||
+ FLOAT *, BLASLONG, int) = {
|
|
||||||
+ sbgemv_thread_n, sbgemv_thread_t,
|
|
||||||
+ };
|
|
||||||
+#endif
|
|
||||||
+ int (*gemv[]) (BLASLONG, BLASLONG, FLOAT, IFLOAT *, BLASLONG,
|
|
||||||
+ IFLOAT *, BLASLONG, FLOAT, FLOAT *, BLASLONG) = {
|
|
||||||
+ SBGEMV_N, SBGEMV_T,};
|
|
||||||
+
|
|
||||||
+
|
|
||||||
+ if (m == 0)
|
|
||||||
+ return;
|
|
||||||
+
|
|
||||||
+ IDEBUG_START;
|
|
||||||
+
|
|
||||||
+ const blasint incb = ((transb & 1) == 0) ? 1 : ldb;
|
|
||||||
+
|
|
||||||
+ if (uplo == 1) {
|
|
||||||
+ for (i = 0; i < m; i++) {
|
|
||||||
+ j = m - i;
|
|
||||||
+
|
|
||||||
+ aa = a + i;
|
|
||||||
+ bb = b + i * ldb;
|
|
||||||
+ if (transa & 1) {
|
|
||||||
+ aa = a + lda * i;
|
|
||||||
+ }
|
|
||||||
+ if (transb & 1)
|
|
||||||
+ bb = b + i;
|
|
||||||
+ cc = c + i * ldc + i;
|
|
||||||
+
|
|
||||||
+#if 0
|
|
||||||
+ if (beta != ONE)
|
|
||||||
+ SCAL_K(l, 0, 0, beta, cc, 1, NULL, 0, NULL, 0);
|
|
||||||
+
|
|
||||||
+ if (alpha == ZERO)
|
|
||||||
+ continue;
|
|
||||||
+#endif
|
|
||||||
+
|
|
||||||
+ IDEBUG_START;
|
|
||||||
+
|
|
||||||
+ buffer_size = j + k + 128 / sizeof(FLOAT);
|
|
||||||
+#ifdef WINDOWS_ABI
|
|
||||||
+ buffer_size += 160 / sizeof(FLOAT);
|
|
||||||
+#endif
|
|
||||||
+ // for alignment
|
|
||||||
+ buffer_size = (buffer_size + 3) & ~3;
|
|
||||||
+ STACK_ALLOC(buffer_size, IFLOAT, buffer);
|
|
||||||
+
|
|
||||||
+#ifdef SMP
|
|
||||||
+
|
|
||||||
+ if (1L * j * k < 2304L * GEMM_MULTITHREAD_THRESHOLD)
|
|
||||||
+ nthreads = 1;
|
|
||||||
+ else
|
|
||||||
+ nthreads = num_cpu_avail(2);
|
|
||||||
+
|
|
||||||
+ if (nthreads == 1) {
|
|
||||||
+#endif
|
|
||||||
+
|
|
||||||
+ if (!(transa & 1))
|
|
||||||
+ (gemv[(int)transa]) (j, k, alpha, aa, lda,
|
|
||||||
+ bb, incb, beta, cc, 1);
|
|
||||||
+ else
|
|
||||||
+ (gemv[(int)transa]) (k, j, alpha, aa, lda,
|
|
||||||
+ bb, incb, beta, cc, 1);
|
|
||||||
+
|
|
||||||
+#ifdef SMP
|
|
||||||
+ } else {
|
|
||||||
+ if (!(transa & 1))
|
|
||||||
+ (gemv_thread[(int)transa]) (j, k, alpha, aa,
|
|
||||||
+ lda, bb, incb, beta, cc,
|
|
||||||
+ 1, nthreads);
|
|
||||||
+ else
|
|
||||||
+ (gemv_thread[(int)transa]) (k, j, alpha, aa,
|
|
||||||
+ lda, bb, incb, beta, cc,
|
|
||||||
+ 1, nthreads);
|
|
||||||
+
|
|
||||||
+ }
|
|
||||||
+#endif
|
|
||||||
+
|
|
||||||
+ STACK_FREE(buffer);
|
|
||||||
+ }
|
|
||||||
+ } else {
|
|
||||||
+
|
|
||||||
+ for (i = 0; i < m; i++) {
|
|
||||||
+ j = i + 1;
|
|
||||||
+
|
|
||||||
+ bb = b + i * ldb;
|
|
||||||
+ if (transb & 1) {
|
|
||||||
+ bb = b + i;
|
|
||||||
+ }
|
|
||||||
+ cc = c + i * ldc;
|
|
||||||
+
|
|
||||||
+#if 0
|
|
||||||
+ if (beta != ONE)
|
|
||||||
+ SCAL_K(l, 0, 0, beta, cc, 1, NULL, 0, NULL, 0);
|
|
||||||
+
|
|
||||||
+ if (alpha == ZERO)
|
|
||||||
+ continue;
|
|
||||||
+#endif
|
|
||||||
+ IDEBUG_START;
|
|
||||||
+
|
|
||||||
+ buffer_size = j + k + 128 / sizeof(FLOAT);
|
|
||||||
+#ifdef WINDOWS_ABI
|
|
||||||
+ buffer_size += 160 / sizeof(FLOAT);
|
|
||||||
+#endif
|
|
||||||
+ // for alignment
|
|
||||||
+ buffer_size = (buffer_size + 3) & ~3;
|
|
||||||
+ STACK_ALLOC(buffer_size, IFLOAT, buffer);
|
|
||||||
+
|
|
||||||
+#ifdef SMP
|
|
||||||
+
|
|
||||||
+ if (1L * j * k < 2304L * GEMM_MULTITHREAD_THRESHOLD)
|
|
||||||
+ nthreads = 1;
|
|
||||||
+ else
|
|
||||||
+ nthreads = num_cpu_avail(2);
|
|
||||||
+
|
|
||||||
+ if (nthreads == 1) {
|
|
||||||
+#endif
|
|
||||||
+
|
|
||||||
+ if (!(transa & 1))
|
|
||||||
+ (gemv[(int)transa]) (j, k, alpha, a, lda, bb,
|
|
||||||
+ incb, beta, cc, 1);
|
|
||||||
+ else
|
|
||||||
+ (gemv[(int)transa]) (k, j, alpha, a, lda, bb,
|
|
||||||
+ incb, beta, cc, 1);
|
|
||||||
+
|
|
||||||
+#ifdef SMP
|
|
||||||
+ } else {
|
|
||||||
+ if (!(transa & 1))
|
|
||||||
+ (gemv_thread[(int)transa]) (j, k, alpha, a, lda,
|
|
||||||
+ bb, incb, beta, cc, 1,
|
|
||||||
+ nthreads);
|
|
||||||
+ else
|
|
||||||
+ (gemv_thread[(int)transa]) (k, j, alpha, a, lda,
|
|
||||||
+ bb, incb, beta, cc, 1,
|
|
||||||
+ nthreads);
|
|
||||||
+ }
|
|
||||||
+#endif
|
|
||||||
+
|
|
||||||
+ STACK_FREE(buffer);
|
|
||||||
+ }
|
|
||||||
+ }
|
|
||||||
+
|
|
||||||
+ IDEBUG_END;
|
|
||||||
+
|
|
||||||
+ return;
|
|
||||||
+}
|
|
||||||
--
|
|
||||||
2.41.0
|
|
||||||
|
|
||||||
From 9a4c2d61a345866e4540f9d6da87eb881419b411 Mon Sep 17 00:00:00 2001
|
|
||||||
From: Honza Horak <hhorak@redhat.com>
|
|
||||||
Date: Fri, 9 Feb 2024 09:54:52 +0100
|
|
||||||
Subject: [PATCH 3/6] fix type conversion warnings
|
|
||||||
|
|
||||||
upstream commit:
|
|
||||||
|
|
||||||
commit fb99fc2e6e4ec8ecdcfffe1ca1aeb787464d2825
|
|
||||||
Author: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de>
|
|
||||||
Date: Wed Feb 7 13:42:08 2024 +0100
|
|
||||||
|
|
||||||
fix type conversion warnings
|
|
||||||
---
|
|
||||||
test/compare_sgemm_sbgemm.c | 18 ++++++++++++++----
|
|
||||||
1 file changed, 14 insertions(+), 4 deletions(-)
|
|
||||||
|
|
||||||
diff --git a/test/compare_sgemm_sbgemm.c b/test/compare_sgemm_sbgemm.c
|
|
||||||
index cf808b56d..4afa8bf93 100644
|
|
||||||
--- a/test/compare_sgemm_sbgemm.c
|
|
||||||
+++ b/test/compare_sgemm_sbgemm.c
|
|
||||||
@@ -81,6 +81,16 @@ float16to32 (bfloat16_bits f16)
|
|
||||||
return f32.v;
|
|
||||||
}
|
|
||||||
|
|
||||||
+float
|
|
||||||
+float32to16 (float32_bits f32)
|
|
||||||
+{
|
|
||||||
+ bfloat16_bits f16;
|
|
||||||
+ f16.bits.s = f32.bits.s;
|
|
||||||
+ f16.bits.e = f32.bits.e;
|
|
||||||
+ f16.bits.m = (uint32_t) f32.bits.m >> 16;
|
|
||||||
+ return f32.v;
|
|
||||||
+}
|
|
||||||
+
|
|
||||||
int
|
|
||||||
main (int argc, char *argv[])
|
|
||||||
{
|
|
||||||
@@ -108,16 +118,16 @@ main (int argc, char *argv[])
|
|
||||||
A[j * k + i] = ((FLOAT) rand () / (FLOAT) RAND_MAX) + 0.5;
|
|
||||||
B[j * k + i] = ((FLOAT) rand () / (FLOAT) RAND_MAX) + 0.5;
|
|
||||||
C[j * k + i] = 0;
|
|
||||||
- AA[j * k + i].v = *(uint32_t *) & A[j * k + i] >> 16;
|
|
||||||
- BB[j * k + i].v = *(uint32_t *) & B[j * k + i] >> 16;
|
|
||||||
+ AA[j * k + i].v = float32to16( A[j * k + i] );
|
|
||||||
+ BB[j * k + i].v = float32to16( B[j * k + i] );
|
|
||||||
CC[j * k + i] = 0;
|
|
||||||
DD[j * k + i] = 0;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
SGEMM (&transA, &transB, &m, &n, &k, &alpha, A,
|
|
||||||
&m, B, &k, &beta, C, &m);
|
|
||||||
- SBGEMM (&transA, &transB, &m, &n, &k, &alpha, AA,
|
|
||||||
- &m, BB, &k, &beta, CC, &m);
|
|
||||||
+ SBGEMM (&transA, &transB, &m, &n, &k, &alpha, (bfloat16*) AA,
|
|
||||||
+ &m, (bfloat16*)BB, &k, &beta, CC, &m);
|
|
||||||
for (i = 0; i < n; i++)
|
|
||||||
for (j = 0; j < m; j++)
|
|
||||||
if (fabs (CC[i * m + j] - C[i * m + j]) > 1.0)
|
|
||||||
--
|
|
||||||
2.41.0
|
|
||||||
|
|
||||||
From 5593507ddbd5d35d088cd4db6285de6b9d84a405 Mon Sep 17 00:00:00 2001
|
|
||||||
From: Honza Horak <hhorak@redhat.com>
|
|
||||||
Date: Fri, 9 Feb 2024 09:56:11 +0100
|
|
||||||
Subject: [PATCH 4/6] fix prototype for c/zaxpby
|
|
||||||
|
|
||||||
Upstream commit:
|
|
||||||
|
|
||||||
commit b3fa16345d83b723b8984b78dc6a2bb5d9f3d479
|
|
||||||
Author: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de>
|
|
||||||
Date: Thu Feb 8 13:15:34 2024 +0100
|
|
||||||
|
|
||||||
fix prototype for c/zaxpby
|
|
||||||
---
|
|
||||||
common_interface.h | 4 ++--
|
|
||||||
1 file changed, 2 insertions(+), 2 deletions(-)
|
|
||||||
|
|
||||||
diff --git a/common_interface.h b/common_interface.h
|
|
||||||
index 318827920..1f6cb5f6d 100644
|
|
||||||
--- a/common_interface.h
|
|
||||||
+++ b/common_interface.h
|
|
||||||
@@ -764,8 +764,8 @@ xdouble BLASFUNC(qlamc3)(xdouble *, xdouble *);
|
|
||||||
|
|
||||||
void BLASFUNC(saxpby) (blasint *, float *, float *, blasint *, float *, float *, blasint *);
|
|
||||||
void BLASFUNC(daxpby) (blasint *, double *, double *, blasint *, double *, double *, blasint *);
|
|
||||||
-void BLASFUNC(caxpby) (blasint *, float *, float *, blasint *, float *, float *, blasint *);
|
|
||||||
-void BLASFUNC(zaxpby) (blasint *, double *, double *, blasint *, double *, double *, blasint *);
|
|
||||||
+void BLASFUNC(caxpby) (blasint *, void *, float *, blasint *, void *, float *, blasint *);
|
|
||||||
+void BLASFUNC(zaxpby) (blasint *, void *, double *, blasint *, void *, double *, blasint *);
|
|
||||||
|
|
||||||
void BLASFUNC(somatcopy) (char *, char *, blasint *, blasint *, float *, float *, blasint *, float *, blasint *);
|
|
||||||
void BLASFUNC(domatcopy) (char *, char *, blasint *, blasint *, double *, double *, blasint *, double *, blasint *);
|
|
||||||
--
|
|
||||||
2.41.0
|
|
||||||
|
|
||||||
From 42b30ed2c54034b2b1dbb15bb9e3e705e704b6a9 Mon Sep 17 00:00:00 2001
|
|
||||||
From: Honza Horak <hhorak@redhat.com>
|
|
||||||
Date: Fri, 9 Feb 2024 09:56:46 +0100
|
|
||||||
Subject: [PATCH 5/6] fix incompatible pointer types
|
|
||||||
|
|
||||||
Upstream commit:
|
|
||||||
|
|
||||||
commit 500ac4de5e20596d5cd797d745db97dd0a62ff86
|
|
||||||
Author: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de>
|
|
||||||
Date: Thu Feb 8 13:18:34 2024 +0100
|
|
||||||
|
|
||||||
fix incompatible pointer types
|
|
||||||
---
|
|
||||||
interface/zaxpby.c | 4 +++-
|
|
||||||
1 file changed, 3 insertions(+), 1 deletion(-)
|
|
||||||
|
|
||||||
diff --git a/interface/zaxpby.c b/interface/zaxpby.c
|
|
||||||
index 3a4db7403..e5065270d 100644
|
|
||||||
--- a/interface/zaxpby.c
|
|
||||||
+++ b/interface/zaxpby.c
|
|
||||||
@@ -39,12 +39,14 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
||||||
|
|
||||||
#ifndef CBLAS
|
|
||||||
|
|
||||||
-void NAME(blasint *N, FLOAT *ALPHA, FLOAT *x, blasint *INCX, FLOAT *BETA, FLOAT *y, blasint *INCY)
|
|
||||||
+void NAME(blasint *N, void *VALPHA, FLOAT *x, blasint *INCX, void *VBETA, FLOAT *y, blasint *INCY)
|
|
||||||
{
|
|
||||||
|
|
||||||
blasint n = *N;
|
|
||||||
blasint incx = *INCX;
|
|
||||||
blasint incy = *INCY;
|
|
||||||
+ FLOAT* ALPHA = (FLOAT*) VALPHA;
|
|
||||||
+ FLOAT* BETA = (FLOAT*) VBETA;
|
|
||||||
|
|
||||||
#else
|
|
||||||
|
|
||||||
--
|
|
||||||
2.41.0
|
|
||||||
|
|
||||||
From 1c525b6e704523912a04fbd026300a2ff95341f3 Mon Sep 17 00:00:00 2001
|
|
||||||
From: Honza Horak <hhorak@redhat.com>
|
|
||||||
Date: Fri, 9 Feb 2024 15:29:17 +0100
|
|
||||||
Subject: [PATCH 6/6] fix sbgemm bfloat16 conversion errors introduced in PR
|
|
||||||
4488
|
|
||||||
|
|
||||||
Upstream commit:
|
|
||||||
|
|
||||||
commit e9f480111e1d5b6f69c8053f79375b0a4242712f
|
|
||||||
Author: Martin Kroeker <martin@ruby.chemie.uni-freiburg.de>
|
|
||||||
Date: Wed Feb 7 19:57:18 2024 +0100
|
|
||||||
|
|
||||||
fix sbgemm bfloat16 conversion errors introduced in PR 4488
|
|
||||||
---
|
|
||||||
test/compare_sgemm_sbgemm.c | 18 ++++++------------
|
|
||||||
1 file changed, 6 insertions(+), 12 deletions(-)
|
|
||||||
|
|
||||||
diff --git a/test/compare_sgemm_sbgemm.c b/test/compare_sgemm_sbgemm.c
|
|
||||||
index 4afa8bf93..bc74233ab 100644
|
|
||||||
--- a/test/compare_sgemm_sbgemm.c
|
|
||||||
+++ b/test/compare_sgemm_sbgemm.c
|
|
||||||
@@ -81,16 +81,6 @@ float16to32 (bfloat16_bits f16)
|
|
||||||
return f32.v;
|
|
||||||
}
|
|
||||||
|
|
||||||
-float
|
|
||||||
-float32to16 (float32_bits f32)
|
|
||||||
-{
|
|
||||||
- bfloat16_bits f16;
|
|
||||||
- f16.bits.s = f32.bits.s;
|
|
||||||
- f16.bits.e = f32.bits.e;
|
|
||||||
- f16.bits.m = (uint32_t) f32.bits.m >> 16;
|
|
||||||
- return f32.v;
|
|
||||||
-}
|
|
||||||
-
|
|
||||||
int
|
|
||||||
main (int argc, char *argv[])
|
|
||||||
{
|
|
||||||
@@ -110,6 +100,8 @@ main (int argc, char *argv[])
|
|
||||||
float C[m * n];
|
|
||||||
bfloat16_bits AA[m * k], BB[k * n];
|
|
||||||
float DD[m * n], CC[m * n];
|
|
||||||
+ bfloat16 atmp,btmp;
|
|
||||||
+ blasint one=1;
|
|
||||||
|
|
||||||
for (j = 0; j < m; j++)
|
|
||||||
{
|
|
||||||
@@ -118,8 +110,10 @@ main (int argc, char *argv[])
|
|
||||||
A[j * k + i] = ((FLOAT) rand () / (FLOAT) RAND_MAX) + 0.5;
|
|
||||||
B[j * k + i] = ((FLOAT) rand () / (FLOAT) RAND_MAX) + 0.5;
|
|
||||||
C[j * k + i] = 0;
|
|
||||||
- AA[j * k + i].v = float32to16( A[j * k + i] );
|
|
||||||
- BB[j * k + i].v = float32to16( B[j * k + i] );
|
|
||||||
+ sbstobf16_(&one, &A[j*k+i], &one, &atmp, &one);
|
|
||||||
+ sbstobf16_(&one, &B[j*k+i], &one, &btmp, &one);
|
|
||||||
+ AA[j * k + i].v = atmp;
|
|
||||||
+ BB[j * k + i].v = btmp;
|
|
||||||
CC[j * k + i] = 0;
|
|
||||||
DD[j * k + i] = 0;
|
|
||||||
}
|
|
||||||
--
|
|
||||||
2.41.0
|
|
||||||
|
|
@ -1,8 +0,0 @@
|
|||||||
summary: CI plan, picks Tier1 tests, runs in beakerlib.
|
|
||||||
discover:
|
|
||||||
- name: fedora
|
|
||||||
how: fmf
|
|
||||||
filter: 'tier: 1'
|
|
||||||
url: https://src.fedoraproject.org/tests/openblas.git
|
|
||||||
execute:
|
|
||||||
how: tmt
|
|
Loading…
Reference in New Issue
Block a user