-
Notifications
You must be signed in to change notification settings - Fork 59
/
Copy pathMakefile
92 lines (71 loc) · 2.45 KB
/
Makefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
# Root of the CUDA toolkit installation. Only set here when the caller has
# not already supplied a non-empty CUDA_PREFIX.
ifndef CUDA_PREFIX
  CUDA_PREFIX = /usr/local/cuda
endif

# Prefix under which the library is installed ($(INSTALL_PREFIX)/lib).
# Only set here when the caller has not already supplied a non-empty value.
ifndef INSTALL_PREFIX
  INSTALL_PREFIX = /usr/local
endif
# Root of the source tree; every source path below is built from it.
SRC_DIR = ./src

# C++ sources (compiled by the %.cpp pattern rule).
SRCS = $(addprefix $(SRC_DIR)/nnet/, \
         conv_bc01_matmul.cpp \
         pool_b01.cpp \
         cudnn.cpp)

# CUDA sources (compiled by the %.cu pattern rule).
CUDA_SRCS = $(addprefix $(SRC_DIR)/, \
              array_ops.cu \
              elementwise.cu \
              reduction.cu \
              blas.cu \
              random.cu \
              image/img2win.cu \
              image/rescale.cu \
              nnet/one_hot.cu)
# Header search path: the project's own headers, then the CUDA toolkit's.
INCLUDE_DIRS = ./include $(CUDA_PREFIX)/include

# Library search path: lib64 is listed first when that directory exists;
# lib is always listed.
ifeq ($(wildcard $(CUDA_PREFIX)/lib64),)
  LIB_DIRS += $(CUDA_PREFIX)/lib
else
  LIB_DIRS += $(CUDA_PREFIX)/lib64 $(CUDA_PREFIX)/lib
endif

# CUDA libraries the shared library is linked against.
LIBS += cudart cublas cufft curand

# Optional cuDNN support: CUDNN_ENABLED=1 defines the CUDNN_ENABLED macro for
# the compilers and adds cudnn to the link line.
ifeq ($(CUDNN_ENABLED),1)
  C_FLAGS += -DCUDNN_ENABLED
  LIBS += cudnn
endif
ifndef CUDA_ARCH
  # By default, libcudarray is built for a range of different CUDA
  # architectures. Compilation is faster when CUDA_ARCH is set to only the
  # architecture of your GPU.
  #
  # For each architecture number the loop below emits two -gencode switches:
  # one with code=sm_NN and one with code=compute_NN.
  # A literal comma cannot be written inside a function argument, hence the
  # helper variable.
  comma := ,
  CUDA_ARCH = $(foreach arch_num,20 30 35, \
                -gencode arch=compute_$(arch_num)$(comma)code=sm_$(arch_num) \
                -gencode arch=compute_$(arch_num)$(comma)code=compute_$(arch_num))
endif
# Put the toolkit's bin directory first on PATH and hand that PATH to the
# recipe shells, so the bare `nvcc` below is looked up there first.
PATH := $(CUDA_PREFIX)/bin:$(PATH)
export PATH

# Host C++ compiler and CUDA compiler.
CXX = g++
NVCC = nvcc

# Directory that receives the linked library.
BUILD_DIR = ./build

# One object per source file, located next to its source.
OBJS = $(patsubst %.cpp,%.o,$(SRCS)) $(patsubst %.cu,%.o,$(CUDA_SRCS))

# Library file name, where it is built, and where it is installed.
LIBCUDARRAY = libcudarray.so
LIBCUDARRAY_BUILD = $(BUILD_DIR)/$(LIBCUDARRAY)
LIBCUDARRAY_INSTALL = $(INSTALL_PREFIX)/lib/$(LIBCUDARRAY)
# -I switch for every header directory.
INCLUDES += $(addprefix -I,$(INCLUDE_DIRS))

# Host compiler flags; also forwarded to nvcc's host compiler below.
C_FLAGS += -O3 -fPIC -Wall -Wfatal-errors -D_FORCE_INLINES

# nvcc flags: target architectures, optimisation level, the host compiler
# flags passed through --compiler-options, and floating-point options.
NVCC_FLAGS = $(CUDA_ARCH) -O3 --compiler-options '$(C_FLAGS)' \
             --ftz=true --prec-div=false -prec-sqrt=false --fmad=true

# -L switch for every library directory, then -l switch for every library.
LDFLAGS += $(addprefix -L,$(LIB_DIRS)) $(addprefix -l,$(LIBS))
# Link all object files into the shared library. The output directory is
# created first because nothing else creates it.
$(LIBCUDARRAY_BUILD): $(OBJS)
	mkdir -p $(@D)
	$(CXX) -shared $(C_FLAGS) -o $@ $^ $(LDFLAGS)
# Compile a C++ source into an object file next to it.
%.o: %.cpp
	$(CXX) $(C_FLAGS) $(INCLUDES) -c -o $@ $<

# Compile a CUDA source into an object file next to it.
%.o: %.cu
	$(NVCC) $(NVCC_FLAGS) $(INCLUDES) -c -o $@ $<
# Conventional entry point: build the shared library.
# Declared phony so a file or directory named `all` cannot make this target
# look up to date.
.PHONY: all
all: $(LIBCUDARRAY_BUILD)
# Copy the built library to its install location. The destination directory
# is created first so installing into a fresh prefix does not fail in cp.
$(LIBCUDARRAY_INSTALL): $(LIBCUDARRAY_BUILD)
	mkdir -p $(@D)
	cp $< $@

# `make install` installs the library. Declared phony so a file named
# `install` in the tree cannot mask the target.
.PHONY: install
install: $(LIBCUDARRAY_INSTALL)
# Remove the installed library. -f makes this a no-op instead of an error
# when the library is not installed. Declared phony so a file named
# `uninstall` cannot mask the target.
.PHONY: uninstall
uninstall:
	rm -f $(LIBCUDARRAY_INSTALL)
# Delete the object files and the library from the build tree.
# Installed files are not touched.
.PHONY: clean
clean:
	rm -f $(OBJS) $(LIBCUDARRAY_BUILD)