-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathMakefile
235 lines (166 loc) · 6.54 KB
/
Makefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
# CURAFFT Makefile -- toolchain and compiler-flag configuration.

# Host C / C++ compilers and the CUDA compiler driver.
CC   := gcc
CXX  := g++
NVCC := nvcc

# GPU architecture flag; set it to match the installed card:
#   sm_60 (Tesla P100), sm_61 (consumer Pascal),
#   sm_70 (Tesla V100, Titan V), sm_80 (A100).
# Alternative form: NVARCH ?= -gencode=arch=compute_70,code=sm_70
NVARCH ?= -arch=sm_80

# Host compiler flags. Each ?= default applies only when the variable is not
# already set (environment or command line).
CFLAGS   ?= -fPIC -O3 -funroll-loops -march=native
CXXFLAGS ?= $(CFLAGS) -std=c++14

# nvcc flags: $(CXX) is used as the host compiler (-ccbin) and $(CXXFLAGS) is
# forwarded to it through -Xcompiler.
NVCCFLAGS ?= -std=c++14 -ccbin=$(CXX) -O3 $(NVARCH) -Wno-deprecated-gpu-targets \
             --default-stream per-thread -Xcompiler "$(CXXFLAGS)" -use_fast_math -lineinfo

# Optional preprocessor defines (uncomment one line to enable):
# NVCCFLAGS+= -DINFO -DDEBUG -DRESULT -DTIME
# NVCCFLAGS+= -DTIME
# Root of the CUDA toolkit. The default is the CUDA 12.1 install location;
# because it is assigned with ?=, a CUDA_ROOT already present in the
# environment (or given as `make CUDA_ROOT=/path/to/cuda`) takes precedence.
# No trailing slash, so derived paths do not contain "//".
CUDA_ROOT ?= /usr/local/cuda-12.1

# Header search path: CUDA toolkit headers, include/cuda_sample, then the
# project's own include/ directory.
INC += -I$(CUDA_ROOT)/include -Iinclude/cuda_sample
INC += -I include

# Library search path. If NVCC_STUBS is set, that directory is searched too.
NVCC_LIBS_PATH += -L$(CUDA_ROOT)/lib64
ifdef NVCC_STUBS
$(info detected NVCC_STUBS -- setting CUDA stubs directory)
NVCC_LIBS_PATH += -L$(NVCC_STUBS)
endif

# Libraries passed to every link step.
LIBS += -lm -lcudart -lstdc++ -lnvToolsExt -lcufft -lcuda
# Library base name and the output locations derived from it.
LIBNAME    := libcurafft
DYNAMICLIB := lib/$(LIBNAME).so
STATICLIB  := lib-static/$(LIBNAME).a
BINDIR     := bin

# Headers that every object file is declared to depend on.
HEADERS := $(addprefix include/,curafft_opts.h curafft_plan.h cugridder.h \
             conv_interp_invoker.h conv.h interp.h cuft.h datatype.h \
             deconv.h precomp.h ragridder_plan.h utils.h common_utils.h) \
           $(addprefix contrib/,common.h legendre_rule_fast.h utils_fp.h)

# TODO (from the original author): move some more files into contrib/.
CONTRIBOBJS := contrib/common.o contrib/utils_fp.o

# Objects built once, with no _32 counterpart.
CURAFFTOBJS := contrib/legendre_rule_fast.o src/common_utils.o

# Objects built without -DSINGLE; $(CONTRIBOBJS) is included in this list.
CURAFFTOBJS_64 := $(addprefix src/fourier/,conv_interp_invoker.o conv.o interp.o cuft.o deconv.o) \
                  $(addprefix src/astro/,cugridder.o precomp.o ra_exec.o) \
                  src/utils.o $(CONTRIBOBJS)

# Matching -DSINGLE objects: same names with a _32 suffix.
# (Original note: "ignore single precision first".)
CURAFFTOBJS_32 := $(patsubst %.o,%_32.o,$(CURAFFTOBJS_64))
# Generic compile rules. Every object lists all of $(HEADERS) as
# prerequisites, so editing any listed header rebuilds every object.

# <name>_32.o: the same source as <name>.o, compiled with -DSINGLE.
%_32.o: %.cpp $(HEADERS)
	$(CXX) -DSINGLE -c $(CXXFLAGS) $(INC) $< -o $@

%_32.o: %.c $(HEADERS)
	$(CC) -DSINGLE -c $(CFLAGS) $(INC) $< -o $@

# CUDA sources are compiled with --device-c.
%_32.o: %.cu $(HEADERS)
	$(NVCC) -DSINGLE --device-c -c $(NVCCFLAGS) $(INC) $< -o $@

# <name>.o: built without -DSINGLE.
%.o: %.cpp $(HEADERS)
	$(CXX) -c $(CXXFLAGS) $(INC) $< -o $@

%.o: %.c $(HEADERS)
	$(CC) -c $(CFLAGS) $(INC) $< -o $@

%.o: %.cu $(HEADERS)
	$(NVCC) --device-c -c $(NVCCFLAGS) $(INC) $< -o $@
# Directory-specific compile rules. They use the same commands as the generic
# %.o / %_32.o rules, restricted to sources under src/ and test/.
#
# Fix: the src/RA rules previously named src/FT/%.cu as their source, so an
# object under src/RA could only be built from a same-named file in src/FT.
# Each rule now reads its source from its own directory.
# NOTE(review): the object lists in this Makefile use src/fourier and
# src/astro, not src/FT and src/RA -- these four rules may be left over from
# an older layout; confirm whether they are still needed.

# --- -DSINGLE variants --------------------------------------------------
src/%_32.o: src/%.cpp $(HEADERS)
	$(CXX) -DSINGLE -c $(CXXFLAGS) $(INC) $< -o $@

src/%_32.o: src/%.c $(HEADERS)
	$(CC) -DSINGLE -c $(CFLAGS) $(INC) $< -o $@

src/%_32.o: src/%.cu $(HEADERS)
	$(NVCC) -DSINGLE --device-c -c $(NVCCFLAGS) $(INC) $< -o $@

src/FT/%_32.o: src/FT/%.cu $(HEADERS)
	$(NVCC) -DSINGLE --device-c -c $(NVCCFLAGS) $(INC) $< -o $@

src/RA/%_32.o: src/RA/%.cu $(HEADERS)
	$(NVCC) -DSINGLE --device-c -c $(NVCCFLAGS) $(INC) $< -o $@

# --- variants without -DSINGLE ------------------------------------------
src/%.o: src/%.cpp $(HEADERS)
	$(CXX) -c $(CXXFLAGS) $(INC) $< -o $@

src/%.o: src/%.c $(HEADERS)
	$(CC) -c $(CFLAGS) $(INC) $< -o $@

src/%.o: src/%.cu $(HEADERS)
	$(NVCC) --device-c -c $(NVCCFLAGS) $(INC) $< -o $@

src/FT/%.o: src/FT/%.cu $(HEADERS)
	$(NVCC) --device-c -c $(NVCCFLAGS) $(INC) $< -o $@

src/RA/%.o: src/RA/%.cu $(HEADERS)
	$(NVCC) --device-c -c $(NVCCFLAGS) $(INC) $< -o $@

# --- test drivers ---------------------------------------------------------
test/%.o: test/%.cu $(HEADERS)
	$(NVCC) --device-c -c $(NVCCFLAGS) $(INC) $< -o $@
# First explicit target in the file, hence the default goal.
default: all

# Note: checkadjoint also runs the adjointness test binary, so `make all`
# both builds and executes that one test.
all: libtest explicit_gridder_test checkadjoint

# testers for the lib (built only, not executed)
libtest: lib convtest utiltest w_s_test nufft_test

convtest: $(addprefix $(BINDIR)/,conv_2d_test conv_3d_test)

explicit_gridder_test: $(BINDIR)/explicit_gridder_test

utiltest: $(BINDIR)/utils_test

w_s_test: $(addprefix $(BINDIR)/,w_s_gridder_test w_s_degridder_test)

nufft_test: $(addprefix $(BINDIR)/,nufft_1d_test nufft_2d_1_test nufft_2d_2_test \
              nufft_1d_3_1_test nufft_1d_3_2_test nufft_3d_1_test)

adjointness_test: $(BINDIR)/adjointness_1d_test
# Link a test executable $(BINDIR)/<name> from test/<name>.o together with
# the $(CURAFFTOBJS_64) and $(CURAFFTOBJS) objects. The output directory is
# created on demand.
$(BINDIR)/%: test/%.o $(CURAFFTOBJS_64) $(CURAFFTOBJS)
	mkdir -p $(BINDIR)
	$(NVCC) $^ $(NVCCFLAGS) $(NVCC_LIBS_PATH) $(LIBS) -o $@
# user-facing library: builds both the static archive and the shared object.
lib: $(STATICLIB) $(DYNAMICLIB)

# $(CONTRIBOBJS) is listed explicitly and is also part of $(CURAFFTOBJS_64);
# $^ drops the duplicate entries, so each object is passed once.

# Static archive. $(@D) is the archive's directory (lib-static by default).
$(STATICLIB): $(CURAFFTOBJS) $(CURAFFTOBJS_64) $(CURAFFTOBJS_32) $(CONTRIBOBJS)
	mkdir -p $(@D)
	$(AR) rcs $@ $^

# Shared library. $(NVCC_LIBS_PATH) is passed here as well, so this link uses
# the same -L directories (including NVCC_STUBS, when set) as the test
# executables; previously it was omitted from this link only.
$(DYNAMICLIB): $(CURAFFTOBJS) $(CURAFFTOBJS_64) $(CURAFFTOBJS_32) $(CONTRIBOBJS)
	mkdir -p $(@D)
	$(NVCC) -shared $(NVCCFLAGS) $^ -o $@ $(NVCC_LIBS_PATH) $(LIBS)
# ---------------------------------------------------------------
# check: print a banner, then run the checkconv and checkfft suites in a
# sub-make.
# NOTE(review): the banner says "all tests", but only checkconv and checkfft
# are invoked here -- confirm which of the two is intended.
check:
	@echo "Building lib, all testers, and running all tests..."
	$(MAKE) checkconv checkfft
# checkconv: build the conv testers (convtest), then run them.
# The binaries are run from $(BINDIR), where convtest builds them, instead of
# a hard-coded bin/, so overriding BINDIR no longer breaks this target.
checkconv: convtest
	@echo "Running conv/interp only tests..."
	@echo "conv 2D.............................................."
	$(BINDIR)/conv_2d_test 0 5 5
	@echo "conv 3D.............................................."
	$(BINDIR)/conv_3d_test 2 12 12 12 800
	@echo "conv 3D.............................................."
	$(BINDIR)/conv_3d_test 0 4096 4096 12 16777216
	$(BINDIR)/conv_3d_test 6 512 512 512 134217728 1e-12 0
	$(BINDIR)/conv_3d_test 6 2048 2048 12 1000000 1e-12 1
# checkutils: build and run the utilities tester.
# Run from $(BINDIR) so the path matches where utiltest builds the binary.
checkutils: utiltest
	@echo "Utilities checking..."
	$(BINDIR)/utils_test
# checkwst: build and run the w_s gridder / degridder testers.
# Run from $(BINDIR) so the paths match where w_s_test builds the binaries.
# The commented lines are disabled alternative invocations kept from the
# original file.
checkwst: w_s_test
	@echo "W stacking checking..."
	$(BINDIR)/w_s_gridder_test 6 1 4096 4096 1000000 10 1 1e-12 0
# bin/w_s_gridder_test 0 1 4096 4096 10000000 10 1 1e-12 0
# bin/w_s_gridder_test 4 1 2048 2048 100000 10 1 1e-12 1
	$(BINDIR)/w_s_degridder_test 0 1 2048 2048 1000000 10 1 1e-12
# bin/w_s_test 0 1 5000 5000 50000000 10
# checkeg: build and run the explicit gridder tester.
# Run from $(BINDIR) so the path matches where the binary is built.
checkeg: explicit_gridder_test
	@echo "Explicit gridder testing..."
	$(BINDIR)/explicit_gridder_test 20 20 20 10
# checkfft: build the NUFFT testers (nufft_test), then run the 1D test once
# and the 3D type-1 test at four problem sizes.
# Run from $(BINDIR) so the paths match where nufft_test builds the binaries.
# NOTE(review): each 3D configuration is invoked several times with identical
# arguments -- presumably to collect repeated timings; confirm before trimming.
checkfft: nufft_test
	@echo "NUFFT testing..."
	$(BINDIR)/nufft_1d_test 4096 4096 1e-13 0 0
	$(BINDIR)/nufft_3d_1_test 64 64 64 262144 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 64 64 64 262144 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 64 64 64 262144 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 64 64 64 262144 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 64 64 64 262144 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 128 128 128 2097152 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 128 128 128 2097152 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 128 128 128 2097152 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 256 256 256 16777216 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 256 256 256 16777216 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 256 256 256 16777216 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 512 512 256 67108864 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 512 512 256 67108864 1e-12 0 6
	$(BINDIR)/nufft_3d_1_test 512 512 256 67108864 1e-12 0 6
# checkadjoint: build and run the 1D adjointness tester.
# Run from $(BINDIR) so the path matches where adjointness_test builds it.
checkadjoint: adjointness_test
	@echo "adjointness testing..."
	$(BINDIR)/adjointness_1d_test
# python: after libtest (which builds the libraries and testers), copy the
# shared library into the Python package directory.
# Uses $(DYNAMICLIB) rather than a hard-coded lib/libcurafft.so, so the copy
# follows any override of LIBNAME / DYNAMICLIB.
python: libtest
	cp $(DYNAMICLIB) python/curagridder/
# -----------------------------------------------------------------
# clean: delete object files from the top level, test/, src/ (including
# src/fourier and src/astro) and contrib/, then remove the output directories.
clean:
	rm -f *.o test/*.o src/*.o src/fourier/*.o src/astro/*.o contrib/*.o
	rm -rf $(BINDIR) lib lib-static
# Targets that name commands, not files. Declaring all of them phony keeps a
# same-named file or directory from making a target look up to date; `lib`
# and `python` are also directory names used by this build.
.PHONY: default all lib libtest python
.PHONY: convtest explicit_gridder_test utiltest w_s_test nufft_test adjointness_test
.PHONY: check checkconv checkutils checkwst checkeg checkfft checkadjoint
.PHONY: clean