export CC = gcc-5
export CXX = g++-5
-all: libpremnotify-cpu
+all: libpremnotify
all: passes
llvm-clang: build/bin/opt
-DCMAKE_CXX_FLAGS='-DHERCULES_PASS_ROOT=\"$(PREFIX)/lib/hercules/\"' \
-G "Ninja" $(CURDIR)/llvm
-libpremnotify-cpu: export CC=$(DEB_HOST_GNU_TYPE)-gcc
+libpremnotify: export CC=$(DEB_HOST_GNU_TYPE)-gcc
endif
< $< > $@
chmod +x $@
-libpremnotify-cpu:
+libpremnotify:
$(MAKE) -C HerculesCompiler/libpremnotify
install: all
--- /dev/null
+--- hercules-compiler.orig/HerculesCompiler/libpremnotify/Makefile
++++ hercules-compiler/HerculesCompiler/libpremnotify/Makefile
+@@ -1,12 +1,22 @@
+ PREFIX=/usr/local
++NVCC=$(or $(shell which nvcc),$(wildcard /usr/local/cuda/bin/nvcc),nvcc)
+
+-all: libpremnotify-cpu.a
++all: libpremnotify-cpu.a libpremnotify-gpu.a
+
+ libpremnotify-cpu.a: libpremnotify-cpu.o
+ $(AR) rcs $@ $^
+
++# 'rcs' replaces members and writes the symbol index (no duplicate members on rebuild, no separate ranlib needed).
++libpremnotify-gpu.a: libpremnotify-gpu.o
++	$(AR) rcs $@ $^
++
++# Device object depends on its CUDA source so that editing the .cu file triggers a rebuild.
++libpremnotify-gpu.o: libpremnotify-gpu.cu
++	$(NVCC) -ccbin $(CC) -arch=compute_62 -code=sm_62 -dc $< -Xptxas -v -Xnvlink -v -Xptxas -maxrregcount=16,-func-maxrregcount=16 -o $@
+ install: all
+ install -D -m 644 libpremnotify-cpu.a $(DESTDIR)$(PREFIX)/lib/hercules/libpremnotify-cpu.a
++ install -D -m 644 libpremnotify-gpu.a $(DESTDIR)$(PREFIX)/lib/hercules/libpremnotify-gpu.a
+
+ clean:
+ rm -rf libpremnotify-cpu.o libpremnotify-cpu.a
++ rm -rf libpremnotify-gpu.o libpremnotify-gpu.a