blob: 979c80f263487cc3db577d95b6347d1a18a835b8 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
|
# --- Toolchain ---------------------------------------------------------------
# All assignments use the recursive `=` form, so right-hand sides are expanded
# only when the variable is actually used.

# C and C++ compilers.
CC     = gcc
CXX    = g++

# CPP is assigned an empty value.
# NOTE(review): presumably the including build then relies on the compiler's
# own preprocessing step - confirm against the consuming Makefile.
CPP    =

# MPI Fortran wrapper; the same command is assigned to FC and to LD.
FC     = mpifort
LD     = mpifort

# CUDA compiler and GPU version selector. _gpuver is not defined anywhere in
# this fragment and has to be provided from outside (command line, environment
# or a substitution step).
NVCC   = nvcc
GPUVER = $(_gpuver)

# Archiver command, including its `-r` flag.
AR     = ar -r
# --- Preprocessor defines ----------------------------------------------------
# DFLAGS is referenced by CFLAGS, CXXFLAGS, FCFLAGS and NVFLAGS.
# The list is accumulated with `+=` (one group per line); the final value is
# the same space-separated sequence of -D options, in the same order.
# NOTE(review): most macro names mirror libraries in LIBS (fftw3, libint2,
# scalapack, elpa, xsmm, xc, symspg); what each macro switches on is decided
# by the sources that consume this file - verify there.
DFLAGS  = -D__FFTW3
DFLAGS += -D__LIBINT
DFLAGS += -D__parallel -D__SCALAPACK
DFLAGS += -D__ELPA
DFLAGS += -D__LIBXSMM
DFLAGS += -D__LIBXC
DFLAGS += -D__SPGLIB
# Accelerator / CUDA related defines.
DFLAGS += -D__ACC -D__DBCSR_ACC -D__PW_CUDA -D__GRID_CUDA
# --- Include search path -----------------------------------------------------
# INCS is referenced by CFLAGS, CXXFLAGS and FCFLAGS.
# The ELPA directories embed $(_elpaver), which is not defined in this fragment
# and must be supplied from outside.
INCS  = -I/usr/include
INCS += -I/usr/include/elpa_openmp-$(_elpaver)/elpa
INCS += -I/usr/include/elpa_openmp-$(_elpaver)/modules
# CUDA toolkit headers.
INCS += -I/opt/cuda/include
# --- Host compiler flags -----------------------------------------------------
# Optimisation settings shared by the C, C++ and Fortran flag sets.
# -march=native tunes the generated code for the machine doing the build.
OPTFLAGS  = -O3 -march=native -fopenmp

# C and C++: defines + include path + optimisation; C++ additionally pins the
# language standard.
CFLAGS    = $(DFLAGS) $(INCS) $(OPTFLAGS)
CXXFLAGS  = $(DFLAGS) $(INCS) $(OPTFLAGS) -std=c++11

# CPPFLAGS is assigned an empty value.
CPPFLAGS  =

# Fortran: the same base set, followed by gfortran-style source-form options
# and -fallow-argument-mismatch.
FCFLAGS   = $(DFLAGS) $(INCS) $(OPTFLAGS)
FCFLAGS  += -ffree-form -ffree-line-length-none
FCFLAGS  += -fallow-argument-mismatch
# --- CUDA compiler flags -----------------------------------------------------
# Shares DFLAGS with the host compilers and forwards -fopenmp to the host
# compiler through -Xcompiler.
NVFLAGS  = $(DFLAGS) -O3 -Xcompiler="-fopenmp"

# One -gencode entry per targeted architecture (compute_XX -> sm_XX).
# NOTE(review): compute_35 / compute_37 are rejected by newer CUDA toolkits
# (support was dropped in CUDA 12) - confirm against the toolkit in /opt/cuda.
NVFLAGS += -gencode arch=compute_35,code=sm_35
NVFLAGS += -gencode arch=compute_37,code=sm_37
NVFLAGS += -gencode arch=compute_50,code=sm_50
NVFLAGS += -gencode arch=compute_52,code=sm_52
NVFLAGS += -gencode arch=compute_60,code=sm_60
NVFLAGS += -gencode arch=compute_61,code=sm_61
NVFLAGS += -gencode arch=compute_70,code=sm_70
NVFLAGS += -gencode arch=compute_75,code=sm_75
NVFLAGS += -gencode arch=compute_80,code=sm_80
NVFLAGS += -gencode arch=compute_86,code=sm_86

# Silence nvcc's warning about deprecated targets in the list above.
NVFLAGS += -Wno-deprecated-gpu-targets
# --- Link step ---------------------------------------------------------------
# The link command reuses the Fortran compile flags verbatim.
LDFLAGS = $(FCFLAGS)

# Libraries are listed so that every library precedes the ones it depends on.
# That ordering is required for single-pass static linking and for linkers
# run with --as-needed; it is harmless for plain shared linking.

# CUDA runtime, driver and math libraries.
LIBS  = -L/opt/cuda/lib64 -lcudart -lcuda
LIBS += -lcublas -lcufft -lrt -lnvrtc

# LIBXSMM: Fortran interface first, then the core library.
LIBS += -lxsmmf -lxsmm

# Dense linear algebra stack. LAPACK calls into BLAS, so -llapack must come
# before -lblas.
LIBS += -lelpa_openmp -lcosma -lscalapack -llapack -lblas

# FFTW: the threads layer depends on the core library, so it is listed first
# (the order documented in the FFTW manual).
LIBS += -lfftw3_threads -lfftw3

# libint2 is linked as a static archive by absolute path.
LIBS += /usr/lib/libint2.a

# libxc (Fortran 2003 interface, then core) and spglib.
LIBS += -lxcf03 -lxc
LIBS += -lsymspg

# System libraries last: the C++ runtime here also serves the static libint2
# archive above.
LIBS += -lstdc++ -lpthread -lm -ldl -lz
|