Spaces:
Runtime error
Runtime error
#/****************************************************************************** | |
# * Copyright (c) 2011, Duane Merrill. All rights reserved. | |
# * Copyright (c) 2011-2018, NVIDIA CORPORATION. All rights reserved. | |
# * | |
# * Redistribution and use in source and binary forms, with or without | |
# * modification, are permitted provided that the following conditions are met: | |
# * * Redistributions of source code must retain the above copyright | |
# * notice, this list of conditions and the following disclaimer. | |
# * * Redistributions in binary form must reproduce the above copyright | |
# * notice, this list of conditions and the following disclaimer in the | |
# * documentation and/or other materials provided with the distribution. | |
# * * Neither the name of the NVIDIA CORPORATION nor the | |
# * names of its contributors may be used to endorse or promote products | |
# * derived from this software without specific prior written permission. | |
# * | |
# * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND | |
# * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | |
# * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE | |
# * DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY | |
# * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | |
# * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | |
# * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | |
# * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | |
# * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | |
# * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |
# * | |
#******************************************************************************/ | |
#------------------------------------------------------------------------------- | |
# Commandline Options | |
#------------------------------------------------------------------------------- | |
# [sm=<XXX,...>] Compute-capability to compile for, e.g., "sm=350,600,700" (SM60 by default).
# A literal comma held in a variable so it can be handed to $(subst) as an
# argument (a bare "," there would be read as an argument separator).
COMMA := ,

# SM_ARCH is the requested architecture list with every comma replaced by a
# dash (sm=350,600 -> 350-600).  Without an sm=... setting it is 600.
ifndef sm
  SM_ARCH = 600
else
  SM_ARCH = $(subst $(COMMA),-,$(sm))
endif
# Per-architecture code generation table.
#
# For every architecture number that occurs (as a substring) in SM_ARCH:
#   SM_DEF     gains the matching -DSM<arch> define,
#   SM_TARGETS gains the matching -gencode option,
#   TEST_ARCH  is overwritten with that architecture.
# Entries are listed from highest to lowest, so TEST_ARCH finishes as the
# lowest architecture that was requested.

ifneq (,$(findstring 700,$(SM_ARCH)))
  SM_DEF += -DSM700
  SM_TARGETS += -gencode=arch=compute_70,code=\"sm_70,compute_70\"
  TEST_ARCH = 700
endif

ifneq (,$(findstring 620,$(SM_ARCH)))
  SM_DEF += -DSM620
  SM_TARGETS += -gencode=arch=compute_62,code=\"sm_62,compute_62\"
  TEST_ARCH = 620
endif

ifneq (,$(findstring 610,$(SM_ARCH)))
  SM_DEF += -DSM610
  SM_TARGETS += -gencode=arch=compute_61,code=\"sm_61,compute_61\"
  TEST_ARCH = 610
endif

ifneq (,$(findstring 600,$(SM_ARCH)))
  SM_DEF += -DSM600
  SM_TARGETS += -gencode=arch=compute_60,code=\"sm_60,compute_60\"
  TEST_ARCH = 600
endif

ifneq (,$(findstring 520,$(SM_ARCH)))
  SM_DEF += -DSM520
  SM_TARGETS += -gencode=arch=compute_52,code=\"sm_52,compute_52\"
  TEST_ARCH = 520
endif

ifneq (,$(findstring 370,$(SM_ARCH)))
  SM_DEF += -DSM370
  SM_TARGETS += -gencode=arch=compute_37,code=\"sm_37,compute_37\"
  TEST_ARCH = 370
endif

ifneq (,$(findstring 350,$(SM_ARCH)))
  SM_DEF += -DSM350
  SM_TARGETS += -gencode=arch=compute_35,code=\"sm_35,compute_35\"
  TEST_ARCH = 350
endif

ifneq (,$(findstring 300,$(SM_ARCH)))
  SM_DEF += -DSM300
  SM_TARGETS += -gencode=arch=compute_30,code=\"sm_30,compute_30\"
  TEST_ARCH = 300
endif
# [cdp=<0|1>] CDP enable option (default: no).
# cdp=1 adds -DCUB_CDP to DEFINES and "-rdc=true -lcudadevrt" to NVCCFLAGS;
# CDP_SUFFIX records the choice as "cdp" or "nocdp".
ifneq ($(cdp),1)
  CDP_SUFFIX = nocdp
else
  CDP_SUFFIX = cdp
  DEFINES += -DCUB_CDP
  NVCCFLAGS += -rdc=true -lcudadevrt
endif
# [force32=<0|1>] Device addressing mode option (64-bit device pointers by default).
# Selects the host word-size flag (CPU_ARCH) and the matching suffix
# (CPU_ARCH_SUFFIX).  NPPI is only set for the 64-bit configuration.
ifneq ($(force32),1)
  CPU_ARCH_SUFFIX = x86_64
  CPU_ARCH = -m64
  NPPI = -lnppist
else
  CPU_ARCH_SUFFIX = i386
  CPU_ARCH = -m32
endif
# [abi=<0|1>] CUDA ABI option (enabled by default).
# Only an explicit abi=0 turns it off, which passes "-Xptxas -abi=no" to nvcc;
# ABI_SUFFIX records the choice as "abi" or "noabi".
ifeq ($(abi),0)
  ABI_SUFFIX = noabi
  NVCCFLAGS += -Xptxas -abi=no
else
  ABI_SUFFIX = abi
endif
# [open64=<0|1>] Middle-end compiler option (nvvm by default).
# open64=1 adds -open64 to NVCCFLAGS; PTX_SUFFIX records the choice as
# "open64" or "nvvm".
ifneq ($(open64),1)
  PTX_SUFFIX = nvvm
else
  PTX_SUFFIX = open64
  NVCCFLAGS += -open64
endif
# Simple on/off switches; each one appends a single nvcc flag when set to 1.

# [verbose=<0|1>] Verbose toolchain output from nvcc (-v)
ifeq (1,$(verbose))
  NVCCFLAGS += -v
endif

# [keep=<0|1>] Keep intermediate compilation artifacts (-keep)
ifeq (1,$(keep))
  NVCCFLAGS += -keep
endif

# [debug=<0|1>] Generate debug mode code (-G)
ifeq (1,$(debug))
  NVCCFLAGS += -G
endif
#------------------------------------------------------------------------------- | |
# Compiler and compilation platform | |
#------------------------------------------------------------------------------- | |
# Directory holding this makefile (the $(dir ...) result keeps its trailing
# slash).  Simply expanded on purpose: MAKEFILE_LIST grows with every later
# `include`, so a deferred expansion would resolve to the directory of
# whichever makefile happened to be read last.
CUB_DIR := $(dir $(lastword $(MAKEFILE_LIST)))

# nvcc executable, wrapped in double quotes.  Same precedence as
# `NVCC ?= ...` (any existing definition wins), but the PATH lookup runs once
# here instead of on every expansion of $(NVCC).
ifeq ($(origin NVCC),undefined)
  NVCC := "$(shell which nvcc)"
endif

# Toolkit release string: the text after "release " and before the next comma
# in the output of `nvcc --version`.  Pass nvccver=<version> to skip the
# query.  The query goes through $(NVCC) so that an overridden compiler
# reports its own version rather than that of whatever nvcc is on PATH.
ifdef nvccver
  NVCC_VERSION := $(nvccver)
else
  NVCC_VERSION := $(strip $(shell $(NVCC) --version | grep release | sed 's/.*release //' | sed 's/,.*//'))
endif

# detect OS (upper-cased `uname -s`; empty when uname is unavailable).
# The character classes are quoted so the shell cannot glob-expand them.
OSUPPER := $(shell uname -s 2>/dev/null | tr '[:lower:]' '[:upper:]')
# Default flags: verbose kernel properties (regs, smem, cmem, etc.); runtimes for compilation phases
# (the trailing "-\#" is an escaped literal '#', not the start of a comment)
NVCCFLAGS += $(SM_DEF) -Xptxas -v -Xcudafe -\#

# Host compiler selection.  OSUPPER containing WIN_NT selects the MSVC setup;
# anything else selects g++.  In both cases CUDART points at the CUDA runtime
# library that sits next to the nvcc binary, chosen to match the word size
# requested via force32 (32-bit only when force32=1, 64-bit otherwise).
ifeq (WIN_NT, $(findstring WIN_NT, $(OSUPPER)))
  # For MSVC
  # Enable more warnings and treat as errors
  NVCCFLAGS += -Xcompiler /W3 -Xcompiler /WX
  # Disable excess x86 floating point precision that can lead to results being labeled incorrectly
  NVCCFLAGS += -Xcompiler /fp:strict
  # Help the compiler/linker work with huge numbers of kernels on Windows
  NVCCFLAGS += -Xcompiler /bigobj -Xcompiler /Zm500
  CC = cl
  # Multithreaded runtime
  NVCCFLAGS += -Xcompiler /MT
  # 32-bit builds link the Win32 import library, 64-bit builds the x64 one
  ifeq ($(force32), 1)
    CUDART_CYG = "$(shell dirname $(NVCC))/../lib/Win32/cudart.lib"
  else
    CUDART_CYG = "$(shell dirname $(NVCC))/../lib/x64/cudart.lib"
  endif
  # Convert the path to native Windows form for the MSVC toolchain
  CUDART = "$(shell cygpath -w $(CUDART_CYG))"
else
  # For g++
  # Disable excess x86 floating point precision that can lead to results being labeled incorrectly
  NVCCFLAGS += -Xcompiler -ffloat-store
  CC = g++
  # 32-bit builds link from lib/, 64-bit builds from lib64/
  ifeq ($(force32), 1)
    CUDART = "$(shell dirname $(NVCC))/../lib/libcudart_static.a"
  else
    CUDART = "$(shell dirname $(NVCC))/../lib64/libcudart_static.a"
  endif
endif
# Suffix to append to each binary.  Fields, joined by underscores:
#   sm<arch list> _ <PTX middle-end> _ <nvcc version> _ <abi> _ <cdp> _ <host word size>
BIN_SUFFIX = sm${SM_ARCH}_${PTX_SUFFIX}_${NVCC_VERSION}_${ABI_SUFFIX}_${CDP_SUFFIX}_${CPU_ARCH_SUFFIX}
#------------------------------------------------------------------------------- | |
# Dependency Lists | |
#------------------------------------------------------------------------------- | |
# $(call rwildcard,<dir-with-trailing-slash>,<pattern>)
# Recursive wildcard: lists every entry below <dir> whose name matches
# <pattern>, where '*' in <pattern> acts like '%' in $(filter).  Each entry
# found by $(wildcard $1*) is both descended into (as "$d/") and tested
# against the pattern.  Must stay recursively expanded so $(call) can bind
# $1 and $2.
rwildcard = $(foreach d,$(wildcard $1*),$(call rwildcard,$d/,$2) $(filter $(subst *,%,$2),$d))

# Files every target depends on: all .cuh headers under CUB_DIR plus this
# makefile.  Simply expanded so the directory tree is walked once at parse
# time instead of on every reference, and so CUB_DIR is resolved here rather
# than at some later point.
CUB_DEPS := $(call rwildcard,$(CUB_DIR),*.cuh) \
            $(CUB_DIR)common.mk