mirror of
https://github.com/slsdetectorgroup/aare.git
synced 2026-06-05 16:48:41 +02:00
3ed773e520
- Wrap per-stream CUDA resources (device buffers, stream handle) in StreamContext struct; ClusterFinderCUDA owns a vector of n_streams contexts with independent pedestal arrays - Split ClusterFinderCUDA.cuh into clusterfinder_kernel.cuh (device kernel) and ClusterFinderCUDA.hpp (host RAII wrapper) - Add find_clusters_batched(): processes N frames round-robin across streams, returns per-frame cluster vectors. - Update ClusterFinderCUDA.test.cu - Update Makefile for new file layout.
24 lines
637 B
Makefile
24 lines
637 B
Makefile
# Toolchain: nvcc drives the build and is told to use $(CXX) as its host
# compiler (see -ccbin in CXXFLAGS below).
CXX      := /usr/bin/c++
NVCC     := nvcc

# GPU architecture flag passed to nvcc.
ARCH     := -arch=sm_89

# Flags handed to nvcc on the command line (not to $(CXX) directly).
CXXFLAGS := -std=c++17 -O3 --extended-lambda -ccbin $(CXX)

# Header and library search paths, relative to this directory.
INCLUDES := -I../include -I../build/_deps/fmt-src/include
LDFLAGS  := -L../build -L../build/_deps/fmt-build
LIBS     := -laare_core -lfmt -lstdc++fs

# Preprocessor definitions.
DEFINES  := -DAARE_LOG_LEVEL=logERROR

# Output binary, its single source file, and the dependency file whose name
# is derived from the source (.cu -> .d).
TARGET   := test_cf_cuda
SRC      := ClusterFinderCUDA.test.cu
DEP      := $(SRC:.cu=.d)

# Default goal: build the test binary.
all: $(TARGET)

# Compile and link the test in a single nvcc invocation.
#
# -MMD -MP -MF $(DEP) -MT $@ make nvcc write $(DEP) alongside the binary: a
# make fragment naming $(TARGET) as the target and the non-system headers
# the source includes as its prerequisites. Without these flags $(DEP) is
# never created, and only the header listed by hand below would trigger a
# rebuild. The explicit header prerequisite is kept so the rule still tracks
# it before any $(DEP) file exists.
$(TARGET): $(SRC) ../include/aare/clusterfinder_kernel.cuh
	$(NVCC) -Xptxas=-v $(ARCH) $(CXXFLAGS) $(DEFINES) $(INCLUDES) $(LDFLAGS) \
		-MMD -MP -MF $(DEP) -MT $@ $< -o $@ $(LIBS)

# Remove the files named by $(TARGET) and $(DEP); -f keeps rm quiet when
# they do not exist.
clean:
	rm -f $(TARGET) $(DEP)

# Read $(DEP) if it exists; the leading '-' suppresses the error when the
# file is missing (for example after `make clean`).
-include $(DEP)

# Delete a target whose recipe failed, so a partially written binary is never
# mistaken for an up-to-date one.
.DELETE_ON_ERROR:

# `all` and `clean` are commands, not files.
.PHONY: all clean