Skip to content
Snippets Groups Projects
Commit 2362ee08 authored by Paul McCarthy's avatar Paul McCarthy :mountain_bicyclist:
Browse files

BF,RF: Fix linux CFLAGS default assignment.

Always add -fPIC on all platforms.

For NVCC, use same variable naming conventions as used in conda-forge build
env.

Use -ccbin rather than --compiler-bindir (they are equivalent), as the
conda-forge nvcc wrapper only checks for the former.

Fix path to supportedGencodes.sh script.
parent 043fe3a2
No related branches found
No related tags found
1 merge request!7Rf/cuda
...@@ -39,10 +39,10 @@ TCLSH ?= ${FSLDIR}/bin/fsltclsh ...@@ -39,10 +39,10 @@ TCLSH ?= ${FSLDIR}/bin/fsltclsh
# environment. # environment.
# Compiler flags for C projects # Compiler flags for C projects
ARCHCFLAGS = -std=c99 ARCHCFLAGS = -std=c99 -fPIC
# Compiler flags for C++ projects. # Compiler flags for C++ projects.
ARCHCXXFLAGS = -std=c++11 ARCHCXXFLAGS = -std=c++11 -fPIC
# Preprocesor flags for C/C++ projects. # Preprocesor flags for C/C++ projects.
ARCHCPPFLAGS = ARCHCPPFLAGS =
...@@ -54,9 +54,11 @@ ARCHLDFLAGS = ...@@ -54,9 +54,11 @@ ARCHLDFLAGS =
ARCHLIBS = ARCHLIBS =
# Compiler flags for CUDA projects. # Compiler flags for CUDA projects.
# This is set in the nvcc block below.
ARCHNVCCFLAGS = ARCHNVCCFLAGS =
# Linker flags for CUDA projects. # Linker flags for CUDA projects.
# This is set in the nvcc block below.
ARCHNVCCLDFLAGS = ARCHNVCCLDFLAGS =
# Allow flags to be provided by the environment. # Allow flags to be provided by the environment.
...@@ -77,8 +79,8 @@ ifeq ($(SYSTYPE), Darwin) ...@@ -77,8 +79,8 @@ ifeq ($(SYSTYPE), Darwin)
# LDFLAGS may be overridden by the environment. # LDFLAGS may be overridden by the environment.
CC ?= clang CC ?= clang
CXX ?= clang++ CXX ?= clang++
CFLAGS ?= -arch x86_64 -Wall -pedantic -fPIC CFLAGS ?= -arch x86_64 -Wall -pedantic
CXXFLAGS ?= -arch x86_64 -Wall -pedantic -fPIC CXXFLAGS ?= -arch x86_64 -Wall -pedantic
LDFLAGS ?= -Wl,-search_paths_first LDFLAGS ?= -Wl,-search_paths_first
ARCHLIBS += -llapack -lblas -lz -lm ARCHLIBS += -llapack -lblas -lz -lm
endif endif
...@@ -95,8 +97,9 @@ ifeq ($(SYSTYPE), Linux) ...@@ -95,8 +97,9 @@ ifeq ($(SYSTYPE), Linux)
CC ?= gcc CC ?= gcc
CXX ?= g++ CXX ?= g++
CFLAGS ?= -fexpensive-optimizations \ CFLAGS ?= -fexpensive-optimizations \
-Wall -pedantic -Wno-long-long -fPIC -Wall -pedantic -Wno-long-long
CXXFLAGS ?= -fexpensive-optimizations \ CXXFLAGS ?= -fexpensive-optimizations \
-Wall -pedantic -Wno-long-long
LDFLAGS ?= -Wl,-rpath,'$$ORIGIN/../lib' LDFLAGS ?= -Wl,-rpath,'$$ORIGIN/../lib'
ARCHLIBS += -lopenblas -lz -lm ARCHLIBS += -lopenblas -lz -lm
endif # if Linux endif # if Linux
...@@ -110,10 +113,15 @@ endif # if Linux ...@@ -110,10 +113,15 @@ endif # if Linux
# CUDA/nvcc compiler options # CUDA/nvcc compiler options
ifneq ($(shell which nvcc), ) ifneq ($(shell which nvcc), )
# We specifically use variable names "CUDA_VER"
# and "CUDA_HOME" because they will be set in
# the conda-forge CUDA build environment (and
# will take precedence over these definitions
# here when they are set).
NVCC ?= nvcc NVCC ?= nvcc
CUDAVER ?= $(shell nvcc --version | grep -Po "release \K[0-9\.]+") CUDA_HOME ?= ${FSLDIR}
GENCODEFLAGS ?= $(shell ${FSLCONFDIR}/common/supportedGencodes.sh ${CUDAVER}) CUDA_VER ?= $(shell nvcc --version | grep -Po "release \K[0-9\.]+")
CUDADIR ?= ${FSLDIR} GENCODEFLAGS ?= $(shell ${FSLCONFDIR}/supportedGencodes.sh ${CUDA_VER})
# nvcc-specific tweaks: # nvcc-specific tweaks:
# - Define ARMA_ALLOW_FAKE_GCC, otherwise byte-alignment issues # - Define ARMA_ALLOW_FAKE_GCC, otherwise byte-alignment issues
...@@ -122,16 +130,18 @@ ifneq ($(shell which nvcc), ) ...@@ -122,16 +130,18 @@ ifneq ($(shell which nvcc), )
# - Do not use -pedantic, otherwise *every single line* of # - Do not use -pedantic, otherwise *every single line* of
# transpiled cuda code will trigger "warning: style of line # transpiled cuda code will trigger "warning: style of line
# directive is a GCC extension". # directive is a GCC extension".
# - Specify the compiler to use with --compiler-bindir, as nvcc # - Specify the compiler to use with -ccbin, as nvcc
# might otherwise naively call "gcc" # might otherwise naively call "gcc" (we specifically use
ARCHNVCCFLAGS = -I${CUDADIR}/include \ # "-ccbin" rather than "--compiler-bindir" here, because the
-maxrregcount=64 \ # conda-forge nvcc wrapper checks for -ccbin, and adds its own
${GENCODEFLAGS} \ # if not present).
-DARMA_ALLOW_FAKE_GCC \ ARCHNVCCFLAGS = -I${CUDA_HOME}/include \
--compiler-bindir \ -maxrregcount=64 \
$(shell which $(CC)) \ ${GENCODEFLAGS} \
--compiler-options \ -DARMA_ALLOW_FAKE_GCC \
-ccbin $(CXX) \
--compiler-options \
"$(filter-out -pedantic, ${ARCHCXXFLAGS})" "$(filter-out -pedantic, ${ARCHCXXFLAGS})"
ARCHNVCCLDFLAGS = -L${CUDADIR}/lib \ ARCHNVCCLDFLAGS = -L${CUDA_HOME}/lib \
-L${CUDADIR}/lib/stubs -L${CUDA_HOME}/lib/stubs
endif endif
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment