From d1ad229d67de5d37761340d4e41929609664d4e9 Mon Sep 17 00:00:00 2001 From: Stefan Roiser Date: Fri, 2 Oct 2020 21:07:45 +0200 Subject: [PATCH 1/2] ignore perf data (cherry picked from commit cb2309c77a849ec360da7bdd2d70bce8131e37ef) --- .gitignore | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/.gitignore b/.gitignore index f8957c4749..130af32b5f 100644 --- a/.gitignore +++ b/.gitignore @@ -8,7 +8,10 @@ *.local.log *.local *~ -/local/ +local/ # profiling profile_* + +# perf data +*-perf-test-run*.json From fe2903787847d522078a0c07cce879beb9608606 Mon Sep 17 00:00:00 2001 From: Stefan Roiser Date: Fri, 2 Oct 2020 21:07:59 +0200 Subject: [PATCH 2/2] fix debug version build (cherry picked from commit 31a8fdadf2435ed486aed716474f2a8227e9571c) --- examples/gpu/eemumu_AV/SubProcesses/Makefile | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/examples/gpu/eemumu_AV/SubProcesses/Makefile b/examples/gpu/eemumu_AV/SubProcesses/Makefile index a138733070..9dbedec357 100644 --- a/examples/gpu/eemumu_AV/SubProcesses/Makefile +++ b/examples/gpu/eemumu_AV/SubProcesses/Makefile @@ -5,6 +5,7 @@ INCDIR=../../src MODELLIB=model_sm CXXFLAGS= -O3 -I. -I$(INCDIR) -DUSE_NVTX -Wall -Wshadow CUARCHFLAGS= -arch=compute_$(CUARCHNUM) +# CUARCHFLAGS= -gencode arch=compute_$(CUARCHNUM),code=sm_$(CUARCHNUM) CUFLAGS= -O3 -I. -I$(INCDIR) -DUSE_NVTX $(CUARCHFLAGS) -use_fast_math -lineinfo # Without -maxrregcount: baseline throughput: 6.5E8 (16384 32 12) up to 7.3E8 (65536 128 12) ###CUFLAGS+= --maxrregcount 160 # improves throughput: 6.9E8 (16384 32 12) up to 7.7E8 (65536 128 12) @@ -38,9 +39,10 @@ all: debug: CXXFLAGS:=$(filter-out -O3,$(CXXFLAGS)) debug: CXXFLAGS += -g -O0 -DDEBUG2 debug: CUFLAGS:=$(filter-out -lineinfo,$(CUFLAGS)) -debug: CUFLAGS += -G +debug: CUFLAGS:=$(filter-out -O3,$(CUFLAGS)) +debug: CUFLAGS += -g -G debug: MAKEDEBUG := debug -debug: $(cu_main) +debug: $(cu_main) $(cxx_main) $(LIBDIR)/lib$(MODELLIB).a: @cd ../../src && make $(MAKEDEBUG)