11#
22#
3- # BLIS
3+ # BLIS
44# An object-based framework for developing high-performance BLAS-like
55# libraries.
66#
3535
3636# Declare the name of the current configuration and add it to the
3737# running list of configurations included by common.mk.
THIS_CONFIG    := zen3
3939# CONFIGS_INCL += $(THIS_CONFIG)
4040
4141#
6565# they make explicit use of the rbp register.
# Kernel (CK*) and reference-kernel (CR*) flags. The optimization flags
# start from COPTFLAGS and add -fomit-frame-pointer (see the note above
# about explicit use of the rbp register).
CKOPTFLAGS     := $(COPTFLAGS) -fomit-frame-pointer
CROPTFLAGS     := $(CKOPTFLAGS)
# Only the vector flags common to every supported compiler are set here.
# Compiler-specific additions (-mfpmath=sse, -funsafe-math-optimizations,
# -ffp-contract=fast) are appended inside the per-vendor branches below.
CKVECFLAGS     := -mavx2 -mfma
CRVECFLAGS     := $(CKVECFLAGS)
7070ifeq ($(CC_VENDOR ) ,gcc)
7171 ifeq ($(GCC_OT_9_1_0),yes) # gcc versions older than 9.1.
7272 CVECFLAGS_VER := -march=znver1 -mno-avx256-split-unaligned-store
@@ -77,6 +77,8 @@ ifeq ($(CC_VENDOR),gcc)
7777 CVECFLAGS_VER := -march=znver3
7878 endif
7979 endif
80+ CKVECFLAGS += -mfpmath=sse
81+ CRVECFLAGS += -funsafe-math-optimizations -ffp-contract=fast
8082else
8183ifeq ($(CC_VENDOR ) ,clang)
8284 ifeq ($(CLANG_OT_9_0_0),yes) # clang versions older than 9.0.
@@ -92,6 +94,8 @@ ifeq ($(CC_VENDOR),clang)
9294 endif
9395 endif
9496 endif
97+ CKVECFLAGS += -mfpmath=sse
98+ CRVECFLAGS += -funsafe-math-optimizations -ffp-contract=fast
9599else
96100ifeq ($(CC_VENDOR ) ,aocc)
97101 ifeq ($(AOCC_OT_2_0_0),yes) # aocc versions older than 2.0.
@@ -103,8 +107,14 @@ ifeq ($(CC_VENDOR),aocc)
103107 CVECFLAGS_VER := -march=znver3
104108 endif
105109 endif
110+ CKVECFLAGS += -mfpmath=sse
111+ CRVECFLAGS += -funsafe-math-optimizations -ffp-contract=fast
else
ifeq ($(CC_VENDOR),nvc)
  # nvc: no compiler-version check is made here; znver3 is targeted
  # directly. Unlike the other vendor branches, only -fast is appended to
  # the reference-kernel vector flags.
  CVECFLAGS_VER := -march=znver3
  CRVECFLAGS    += -fast
else
  # Reached only when CC_VENDOR matched none of the vendors tested above.
  $(error gcc, clang, nvc or aocc is required for this configuration.)
endif
108118endif
109119endif
110120endif
@@ -114,4 +124,3 @@ CRVECFLAGS += $(CVECFLAGS_VER)
# Store all of the variables here to new variables containing the
# configuration name. store-make-defs is defined outside this file and is
# invoked with THIS_CONFIG as its only argument.
$(eval $(call store-make-defs,$(THIS_CONFIG)))
117-
0 commit comments