From 9f2dbfa7df981d41c070261c4b9a8a875b290203 Mon Sep 17 00:00:00 2001
From: AlexeyAB
Date: Tue, 17 Apr 2018 14:39:27 +0300
Subject: [PATCH] Added flag AVX to the Makefile

---
Reviewer notes (free-form area, ignored when the patch is applied):
 * Introduces a new top-level switch AVX, defaulting to 0, and moves
   DEBUG=0 below a new block of usage comments.
 * "-ffp-contract=fast -mavx" used to be appended to CFLAGS for every
   non-DEBUG build; after this patch they are appended only when AVX=1.
   With the default AVX=0 they are therefore no longer added.
 * The AVX test is nested inside the DEBUG "else" branch, so a DEBUG=1
   build never gets these flags, whatever AVX is set to.

 Makefile | 10 +++++++++-
 1 file changed, 9 insertions(+), 1 deletion(-)

diff --git a/Makefile b/Makefile
index b6119ae5..61861b54 100644
--- a/Makefile
+++ b/Makefile
@@ -2,10 +2,16 @@ GPU=0
 CUDNN=0
 CUDNN_HALF=0
 OPENCV=0
-DEBUG=0
+AVX=0
 OPENMP=0
 LIBSO=0
 
+# set GPU=1 and CUDNN=1 to speedup on GPU
+# set CUDNN_HALF=1 to further speedup 3 x times (Mixed-precision using Tensor Cores) on GPU Tesla V100, Titan V, DGX-2
+# set AVX=1 and OPENMP=1 to speedup on CPU (if error occurs then set AVX=0)
+
+DEBUG=0
+
 ARCH= -gencode arch=compute_30,code=sm_30 \
       -gencode arch=compute_35,code=sm_35 \
       -gencode arch=compute_50,code=[sm_50,compute_50] \
@@ -50,8 +56,10 @@ CFLAGS=-Wall -Wfatal-errors -Wno-unused-result -Wno-unknown-pragmas
 ifeq ($(DEBUG), 1)
 OPTS= -O0 -g
 else
+ifeq ($(AVX), 1)
 CFLAGS+= -ffp-contract=fast -mavx
 endif
+endif
 
 CFLAGS+=$(OPTS)
 