Page Menu
Home
c4science
Search
Configure Global Search
Log In
Files
F93768012
Makefile.GPU.gnu
No One
Temporary
Actions
Download File
Edit File
Delete File
View Transforms
Subscribe
Mute Notifications
Award Token
Subscribers
None
File Metadata
Details
File Info
Storage
Attached
Created
Sun, Dec 1, 08:25
Size
3 KB
Mime Type
text/x-makefile
Expires
Tue, Dec 3, 08:25 (1 d, 23 h)
Engine
blob
Format
Raw Data
Handle
22699785
Attached To
R1448 Lenstool-HPC
Makefile.GPU.gnu
View Options
#
# Name of the benchmark executable produced by the link rule.
PROGRAM_NAME := ChiBenchmark_GPU

# Default goal. The former extra prerequisite $(PROGRAM_NAME_GPU) was never
# defined in this file and expanded to nothing, so it has been dropped; the
# set of files actually built is unchanged.
all: $(PROGRAM_NAME)

# C++ compiler driver (MPI wrapper). It is also handed to nvcc through
# -ccbin where NVFLAGS is assembled.
# Earlier non-MPI setting: CXX=g++ -lm -ffast-math -ftree-loop-vectorize
CXX := mpic++
#
# Discover the sources in the current directory and derive, for each one,
# the object file it is compiled to.
#
# C++ sources: foo.cpp -> foo.o
program_CXX_SRCS := $(wildcard *.cpp)
program_CXX_OBJS := $(patsubst %.cpp,%.o,$(program_CXX_SRCS))
#
# C sources: foo.c -> foo.o
program_C_SRCS := $(wildcard *.c)
program_C_OBJS := $(patsubst %.c,%.o,$(program_C_SRCS))
#
# CUDA sources: foo.cu -> foo.cu.o (the .cu infix is kept in the object name,
# matching the %.cu.o pattern rule).
program_CU_SRCS := $(wildcard *.cu)
program_CU_OBJS := $(patsubst %.cu,%.cu.o,$(program_CU_SRCS))
#
#
# Header search directories. Every entry is later turned into a -I option.
# The *_ROOT variables are not set in this file; they are expected to come
# from the environment or the command line.
#
program_INCLUDE_DIRS := . /usr/local/cuda/include/ \
                        $(CFITSIO_ROOT)/include \
                        $(LENSTOOL_ROOT)/include \
                        $(GSL_ROOT)/include \
                        $(LENSTOOLHPC_ROOT)/src \
                        $(CUDA_ROOT)/include
#
# Library search directories. Every entry is later turned into a -L option.
# Appended with += so that a value supplied from outside is kept.
#
program_INCLUDE_LIBS += $(CFITSIO_ROOT)/lib \
                        $(LENSTOOL_ROOT)/src \
                        $(LENSTOOL_ROOT)/liblt \
                        $(LENSTOOLHPC_ROOT)/src \
                        $(GSL_ROOT)/lib \
                        $(WCSTOOL_ROOT)/libwcs \
                        $(CUDA_ROOT)/lib64
#
#
# Host compiler flags
#
# Search paths: one -I per include directory, one -L per library directory.
CXXFLAGS += $(addprefix -I,$(program_INCLUDE_DIRS))
CXXFLAGS += $(addprefix -L,$(program_INCLUDE_LIBS))
# Preprocessor switches passed to the C++ sources.
#CXXFLAGS += -D__WITH_LENSTOOL
CXXFLAGS += -D__WITH_MPI -D__WITH_UM -D__WITH_GPU
# Shared flag fragments. Their contents are not visible from this file;
# presumably precision.inc is what defines PRECISION -- TODO confirm.
include ../../src/cpuflags.gnu.inc
include $(LENSTOOLHPC_ROOT)/src/precision.inc
CXXFLAGS += $(PRECISION)
# Disabled alternatives (Intel-compiler option spellings), kept for reference:
#CXXFLAGS += -no-vec
#CXXFLAGS += -qopenmp -march=core-avx2 -g -O3 -std=c++0x -Wall -pedantic
#CXXFLAGS += -llenstoolhpc -qopenmp -xHost -g -O3 -std=c++0x -Wall -pedantic
#CXXFLAGS += -llenstoolhpc -qopenmp -axMIC-AVX512,CORE-AVX2 -g -O3 -std=c++0x -Wall -pedantic
#CXXFLAGS += -qopt-prefetch-distance=64,8 -qopt-streaming-cache-evict=0 -llenstoolhpc -qopenmp -xMIC-AVX512 -g -O3 -std=c++0x -Wall -pedantic
#
# Libraries to link against.
# Original author's note: do not keep lenstool for the float calculation,
# it creates a conflict in the structure.h file.
# NOTE(review): -llenstool is nevertheless still listed, and -llenstoolhpc
# appears twice in a row -- confirm both are intended.
LDFLAGS := -llenstoolhpc -llenstoolhpc -llenstoolhpc_GPU -llt -lcfitsio -lwcs -lgsl -lgslcblas -llenstool
#
# Earlier nvcc flag sets that used icpc as host compiler, kept for reference:
#NVFLAGS := -O3 -g -G -rdc=true -ccbin icpc -Xcompiler '-Wall -fPIC -qopenmp' -D__WITH_LENSTOOL
#NVFLAGS := -O3 -ccbin icpc -Xcompiler '-Wall -fPIC -qopenmp' -D__WITH_LENSTOOL
#
# Shared GPU flag fragments. Their contents are not visible from this file;
# presumably one of them defines GENCODE -- TODO confirm.
include ../../src/gpuflags.inc
include ../../src/gpusm.inc
# Host compiler used by nvcc and the options forwarded to it.
# NOTE(review): -qopenmp is the Intel spelling of the OpenMP switch; with a
# GNU-based $(CXX) the equivalent is -fopenmp -- confirm which compiler
# mpic++ wraps on the target system.
NVFLAGS += -ccbin $(CXX) -Xcompiler '-Wall -fPIC -qopenmp -Ofast $(PRECISION)'
#NVFLAGS += -ccbin $(CXX) -Xcompiler '$(CXXFLAGS)'
# Target architectures, precision define and MPI switch for device code.
NVFLAGS += $(GENCODE) $(PRECISION) -D__WITH_MPI
# Optional tuning/debug toggles, currently disabled:
#NVFLAGS += --maxrregcount=64
#NVFLAGS += -G
#NVFLAGS += -D__WITH_UM
#NVFLAGS += -D_double
#NVFLAGS += -gencode arch=compute_60,code=sm_60
#NVFLAGS += -use_fast_math
# Same search paths as the host compiler.
NVFLAGS += $(addprefix -I,$(program_INCLUDE_DIRS))
NVFLAGS += $(addprefix -L,$(program_INCLUDE_LIBS))
#
# Complete the host link flags with the search paths first, so that LDFLAGS
# is final before it is folded into NVLDFLAGS.
LDFLAGS += $(addprefix -I,$(program_INCLUDE_DIRS))
LDFLAGS += $(addprefix -L,$(program_INCLUDE_LIBS))
#
# CUDA link flags: search paths, the CUDA runtime libraries, then everything
# the host link already uses.
NVLDFLAGS += $(addprefix -I,$(program_INCLUDE_DIRS))
NVLDFLAGS += $(addprefix -L,$(program_INCLUDE_LIBS))
NVLDFLAGS += -lcudart -lcudadevrt -lnvToolsExt
NVLDFLAGS += $(LDFLAGS)
#
# Disabled extra link options:
#LDFLAGS += -O3 -g -qopenmp
#LDFLAGS += -qopenmp
#
# Object groups consumed by the link rule: host objects (C++ and C) and
# device objects (CUDA).
CPU_OBJECTS = $(program_CXX_OBJS) $(program_C_OBJS)
GPU_OBJECTS = $(program_CU_OBJS)
#
# CUDA compiler driver. Defaults to the nvcc found on PATH; override with
# `make NVCC=/path/to/nvcc` or by defining NVCC before this point.
NVCC ?= nvcc
#
# Compile one CUDA source into its object (foo.cu -> foo.cu.o). The same-named
# foo.cuh header is a prerequisite, so editing it triggers a rebuild.
# The recipe line must start with a TAB.
%.cu.o: %.cu %.cuh
	$(NVCC) $(NVFLAGS) -o $@ -c $<
# Alternative invocations, kept for reference:
#nvcc $(NVFLAGS) -o $@ -rdc=true $<
#nvcc $(NVFLAGS) -Xptxas -dlcm=cg --ptxas-options=-v -o $@ -dc $<
#
# Compile one C++ source into its object (foo.cpp -> foo.o).
#
# The rule previously read `%.cpp: %.cpp %.h` with a recipe lacking -c: its
# target was the source file itself, so it could never produce an object and
# would have overwritten the source had it ever run. Objects were in fact
# being built by make's built-in %.o: %.cpp rule, which ignores headers.
#
# First form: used when a same-named header exists, so that editing foo.h
# rebuilds foo.o.
%.o: %.cpp %.h
	$(CXX) $(CPPFLAGS) $(CXXFLAGS) -c -o $@ $<
# Fallback for sources without a same-named header.
%.o: %.cpp
	$(CXX) $(CPPFLAGS) $(CXXFLAGS) -c -o $@ $<
#
# Link the benchmark executable from all host and device objects.
# The objects are passed device-first, as before. $(LDFLAGS) appears both
# directly and inside $(NVLDFLAGS); the repetition is kept because removing
# it would change the library order seen by the linker.
# The recipe line must start with a TAB.
$(PROGRAM_NAME): $(CPU_OBJECTS) $(GPU_OBJECTS)
	$(CXX) -o $@ $(GPU_OBJECTS) $(CPU_OBJECTS) $(LDFLAGS) $(NVLDFLAGS) $(CXXFLAGS)
# Former CPU-only link rule using the Intel compiler, kept for reference:
#$(PROGRAM_NAME): $(CPU_OBJECTS)
#	icpc -o $@ $^ $(LDFLAGS)
# Remove the executable, all object files, editor backups (*~) and *.optrpt
# files. The undefined $(OBJECTS) was replaced by the object lists this
# Makefile actually builds; *.o is kept to catch stale objects as well.
# The leading '-' keeps make going even if the removal reports an error.
clean:
	@-$(RM) $(PROGRAM_NAME) $(CPU_OBJECTS) $(GPU_OBJECTS) *~ *.o *.optrpt
#
# Nothing beyond what `clean` removes is generated, so distclean just
# delegates to it.
distclean: clean
#
# These names are commands, not files.
.PHONY: all clean distclean
Event Timeline
Log In to Comment