forked from pierrepaleo/PDWT
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathMakefile
executable file
·37 lines (31 loc) · 1.73 KB
/
Makefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
# CUDA compiler driver, used for both the compile and the link steps.
NVCC=nvcc
# Optional extra nvcc flags (e.g. the target GPU architecture). Uncomment, or
# pass on the command line: make CFLAGS=-arch=sm_30
#CFLAGS="-arch=sm_30"
# Libraries appended to the link command line.
LDFLAGS=-lcublas
# Every source file that goes into the library (CUDA and host C++).
PDWTCORE := src/wt.cu src/common.cu src/utils.cu src/separable.cu src/nonseparable.cu src/haar.cu src/filters.cpp src/pdwt.cpp
# Object files, derived from PDWTCORE so the two lists cannot drift apart:
# src/<name>.<ext> -> build/<name>.o
PDWTOBJ := $(addprefix build/,$(addsuffix .o,$(basename $(notdir $(PDWTCORE)))))
#
# Using constant memory across several files requires separate compilation (relocatable device code).
# Otherwise a new constant memory buffer is created for each file (even if the symbol is defined in a common file),
# since __constant__ variables have file-scope linkage. This was fine until the introduction of Wavelets::set_filters().
# As constant memory is managed through "symbols" rather than buffers, another strategy would be to
# get the pointer address with cudaGetSymbolAddress(), which is not recommended.
#
# Separate compilation might be the way to go for better modularity, easier refactoring and faster compilation.
# However, cython does not offer the flexibility to perform two link steps (one "nvcc --dlink" to link the cuda ".o" files together,
# the other to link the pyx ".o" with the linked cuda ".o").
#
# If you still want to use separate compilation :
# - replace "-c $^" with "-dc $^" in the Makefile targets rules
# - uncomment the definition of SEPARATE_COMPILATION in filters.h
#
# Single-precision shared library.
# Step 1: compile every source in $(PDWTCORE) with a single nvcc invocation,
#         writing the objects into build/ (-odir); '-fPIC' is forwarded to the
#         host compiler because the objects end up in a shared library.
# Step 2: link the objects listed in $(PDWTOBJ) into the shared library.
libpdwt.so: $(PDWTCORE)
	mkdir -p build
	$(NVCC) $(CFLAGS) --ptxas-options=-v --compiler-options '-fPIC' -odir build -c $^
	$(NVCC) $(CFLAGS) -o $@ --shared $(PDWTOBJ) $(LDFLAGS)
# Double precision library.
# Same two steps as the single-precision build, but the sources are compiled
# with -DDOUBLEPRECISION. $(CFLAGS) is passed to the compile step as well as
# the link step so that user-supplied flags (e.g. -arch=...) apply to both.
# NOTE: the objects are written to the same build/ directory as the
# single-precision ones, so the two libraries should not be built in parallel.
libpdwtd.so: $(PDWTCORE)
	mkdir -p build
	$(NVCC) $(CFLAGS) --ptxas-options=-v --compiler-options '-fPIC' -DDOUBLEPRECISION -odir build -c $^
	$(NVCC) $(CFLAGS) -o $@ --shared $(PDWTOBJ) $(LDFLAGS)
# Remove generated files: the build/ object directory, `demo`, and every
# library matching libpdwt*.so.
# Declared phony so that a file or directory named "clean" cannot make this
# target look up to date.
.PHONY: clean
clean:
	rm -rf build demo libpdwt*.so