Added support for K80/sm_37 (NVIDIA Tesla K80, compute capability 3.7)

This commit is contained in:
Evghenii Gaburov
2015-02-21 14:28:47 +01:00
parent 86ba817445
commit bf3b15b744
8 changed files with 38 additions and 20 deletions

View File

@@ -3,6 +3,9 @@ ISPC_SRC=ao.ispc
CU_SRC=ao.cu
CXX_SRC=ao.cpp
PTXCC_REGMAX=64
NVARCH=sm_35
#PTXCC_REGMAX=128
#NVARCH=sm_37
#ISPC_FLAGS= --opt=disable-uniform-control-flow
#LLVM_GPU=1

View File

@@ -1,21 +1,22 @@
NVCC_SRC=../../util/nvcc_helpers.cu
NVCC_OBJS=objs_ptx/nvcc_helpers_nvcc.o
NVARCH ?= sm_35
#
CXX=g++ -ffast-math
CXXFLAGS=-O3 -I$(CUDATK)/include -Iobjs_ptx/ -D_CUDA_ -I../../util -I../../
#
NVCC=nvcc
NVCC_FLAGS+=-O3 -arch=sm_35 -D_CUDA_ -I../../util -Xptxas=-v -Iobjs_ptx/
NVCC_FLAGS+=-O3 -arch=$(NVARCH) -D_CUDA_ -I../../util -Xptxas=-v -Iobjs_ptx/
ifdef PTXCC_REGMAX
NVCC_FLAGS += --maxrregcount=$(PTXCC_REGMAX)
endif
NVCC_FLAGS+=--use_fast_math
#
LD=nvcc
LDFLAGS=-lcudart -lcudadevrt -arch=sm_35
LDFLAGS=-lcudart -lcudadevrt -arch=$(NVARCH)
#
PTXCC=$(ISPC_HOME)/ptxtools/ptxcc
PTXCC_FLAGS+= -Xptxas=-v
PTXCC=$(ISPC_HOME)/ptxtools/ptxcc --arch=$(NVARCH)
PTXCC_FLAGS+= -Xptxas=-v
ifdef PTXCC_REGMAX
PTXCC_FLAGS += -maxrregcount=$(PTXCC_REGMAX)
endif
@@ -41,13 +42,13 @@ CXX_SRC+=ispc_malloc.cpp
CXX_OBJS+=objs_ptx/ispc_malloc_gcc.o
PTXGEN = $(ISPC_HOME)/ptxtools/ptxgen
PTXGEN += --use_fast_math
PTXGEN += --use_fast_math --arch=$(NVARCH)
#LLVM32=$(HOME)/usr/local/llvm/bin-3.2
#LLVM32DIS=$(LLVM32)/bin/llvm-dis
LLC=$(LLVM_ROOT)/bin/llc
LLC_FLAGS=-march=nvptx64 -mcpu=sm_35
LLC_FLAGS=-march=nvptx64 -mcpu=$(NVARCH)
# .SUFFIXES: .bc .o .cu .ll

View File

@@ -3,6 +3,7 @@ ISPC_SRC=kernels.ispc
CU_SRC=kernels.cu
CXX_SRC=common.cpp main.cpp
PTXCC_REGMAX=64
NVARCH=sm_35
NVVM_GPU=1
#LLVM_GPU=1

View File

@@ -2,10 +2,11 @@ PROG=hermite4
ISPC_SRC=hermite4.ispc
#CU_SRC=hermite4.cu
CXX_SRC=hermite4.cpp
PTXCC_REGMAX=64
PTXCC_REGMAX=128
#ISPC_FLAGS= --opt=disable-uniform-control-flow
NVARCH=sm_37
#LLVM_GPU=1
# LLVM_GPU=1
NVVM_GPU=1
include ../common_ptx.mk