2022-08-09 18:53:53 +02:00
|
|
|
# Compiler driver for this toolchain: NVIDIA's nvcc.
CC = nvcc
|
|
|
|
# Link with the same driver that compiles. This is a recursive (=) assignment,
# so LINKER follows any later change or command-line override of CC.
LINKER = $(CC)
|
|
|
|
|
|
|
|
# Start of the strict-conformance flag set; later lines append to it with +=.
# NOTE(review): where ANSI_CFLAGS is consumed is not visible in this file.
ANSI_CFLAGS = -ansi
|
|
|
|
# Select the C99 dialect.
# NOTE(review): this is appended after -ansi, which requests a different
# standard; with GCC the later -std option is expected to win -- confirm that
# -ansi is still wanted.
ANSI_CFLAGS += -std=c99
|
|
|
|
# Ask for diagnostics on code that strays from the selected language standard.
ANSI_CFLAGS += -pedantic
|
|
|
|
# Enable the additional warning group on top of the compiler defaults.
ANSI_CFLAGS += -Wextra
|
|
|
|
|
2022-11-14 18:01:46 +01:00
|
|
|
#
|
|
|
|
# A100 + Native
|
2022-12-18 14:28:29 +01:00
|
|
|
#CFLAGS = -O3 -arch=sm_80 -march=native -ffast-math -funroll-loops --forward-unknown-to-host-compiler # -fopenmp
|
|
|
|
# Active build flags (the only uncommented CFLAGS assignment in this file).
# -arch names the virtual architecture (compute_61) and -code lists the real
# GPU targets to generate code for (sm_61, sm_80, sm_86).
# -march=native, -ffast-math and -funroll-loops are host-compiler options;
# --forward-unknown-to-host-compiler lets nvcc pass options it does not
# recognise through to the host compiler.
# OpenMP (-fopenmp) is left disabled inside the trailing comment.
CFLAGS = -O3 -arch=compute_61 -code=sm_61,sm_80,sm_86 -march=native -ffast-math -funroll-loops --forward-unknown-to-host-compiler # -fopenmp
|
2022-11-14 18:01:46 +01:00
|
|
|
# A40 + Native
|
2022-11-14 18:21:14 +01:00
|
|
|
#CFLAGS = -O3 -arch=sm_86 -march=native -ffast-math -funroll-loops --forward-unknown-to-host-compiler # -fopenmp
|
2022-11-14 18:01:46 +01:00
|
|
|
# Cascade Lake
|
2022-11-07 20:37:01 +01:00
|
|
|
#CFLAGS = -O3 -march=cascadelake -ffast-math -funroll-loops --forward-unknown-to-host-compiler # -fopenmp
|
2022-11-14 18:01:46 +01:00
|
|
|
# For GROMACS kernels, we need at least sm_61 due to atomicAdd with doubles
|
|
|
|
# TODO: Check if this is required for full neighbor-lists and just compile kernel for that case if not
|
2022-08-09 18:53:53 +02:00
|
|
|
#CFLAGS = -O3 -g -arch=sm_61 # -fopenmp
|
|
|
|
# Assembler-related flags: -masm=intel is the GCC option that selects Intel
# syntax for x86 assembly.
# NOTE(review): how ASFLAGS is used in an nvcc build is not visible here.
ASFLAGS = -masm=intel
|
|
|
|
# Extra linker flags; empty in this toolchain file.
LFLAGS =
|
|
|
|
# Preprocessor defines: _GNU_SOURCE, CUDA_TARGET and NO_ZMM_INTRIN are set;
# LIKWID_PERFMON is disabled inside the trailing comment.
# NOTE(review): the project-specific macros are interpreted by sources not
# shown here.
DEFINES = -D_GNU_SOURCE -DCUDA_TARGET -DNO_ZMM_INTRIN #-DLIKWID_PERFMON
|
|
|
|
# Include-path flags come solely from LIKWID_INC, which is not defined in this
# file; an unset make variable expands to nothing.
INCLUDES = $(LIKWID_INC)
|
|
|
|
# Libraries to link: libm, whatever LIKWID_LIB expands to (defined outside this
# file), the CUDA driver library (-lcuda) and the CUDA runtime (-lcudart).
# -llikwid is disabled inside the trailing comment.
LIBS = -lm $(LIKWID_LIB) -lcuda -lcudart #-llikwid
|