@@ -130,21 +130,21 @@ GPUg() void runKernelHIP(GPUCA_CONSMEM_PTR int iSlice_internal, Args... args)
// Redefine GPUCA_KRNL_CUSTOM for this backend: it hands its single argument to GPUCA_M_STRIP.
// GPUCA_M_STRIP is defined outside this view; presumably it removes the surrounding parentheses - TODO confirm.
130130#undef GPUCA_KRNL_CUSTOM
131131#define GPUCA_KRNL_CUSTOM (args ) GPUCA_M_STRIP(args)
// Extra backend-specific parameters: two hipEvent_t pointers followed by a trailing comma.
// This change renames them from start/stop to debugStartEvent/debugStopEvent; the launch macros
// GPUCA_KRNL_CALL_single and GPUCA_KRNL_CALL_multi refer to these parameters by name.
// NOTE(review): the parameter list this macro is spliced into is not visible in this hunk.
132132#undef GPUCA_KRNL_BACKEND_XARGS
133- #define GPUCA_KRNL_BACKEND_XARGS hipEvent_t *start , hipEvent_t *stop ,
133+ #define GPUCA_KRNL_BACKEND_XARGS hipEvent_t *debugStartEvent , hipEvent_t *debugStopEvent ,
// Per-kernel expansion: GPUCA_KRNL_PROP(x_class, x_attributes) followed by
// GPUCA_KRNL_WRAP(GPUCA_KRNL_, ...) with all four arguments forwarded unchanged.
// Both helper macros are defined outside this view.
// GPUCA_KRNL is #undef'd again right after GPUReconstructionKernels.h is included, so that header
// presumably invokes it once per kernel - TODO confirm.
134134#define GPUCA_KRNL (x_class, x_attributes, x_arguments, x_forward ) \
135135 GPUCA_KRNL_PROP (x_class, x_attributes) \
136136 GPUCA_KRNL_WRAP(GPUCA_KRNL_, x_class, x_attributes, x_arguments, x_forward)
// Removed by this change: previous GPUCA_KRNL_CALL_single, which tested and dereferenced the
// event pointers under their old names start/stop. Apart from those two names the body is the
// same as the added version of this macro.
137- #define GPUCA_KRNL_CALL_single (x_class, x_attributes, x_arguments, x_forward ) \
138- if (start == nullptr ) { \
139- hipLaunchKernelGGL (HIP_KERNEL_NAME (GPUCA_M_CAT (krnl_, GPUCA_M_KRNL_NAME (x_class))), dim3 (x.nBlocks ), dim3 (x.nThreads ), 0 , me->mInternals ->Streams [x.stream ], GPUCA_CONSMEM_CALL y.start , args...); \
140- } else { \
141- hipExtLaunchKernelGGL (HIP_KERNEL_NAME (GPUCA_M_CAT (krnl_, GPUCA_M_KRNL_NAME (x_class))), dim3 (x.nBlocks ), dim3 (x.nThreads ), 0 , me->mInternals ->Streams [x.stream ], *start , *stop , 0 , GPUCA_CONSMEM_CALL y.start , args...); \
142- }
// Removed by this change: previous GPUCA_KRNL_CALL_multi, using the old event names start/stop.
// The closing brace of its else-branch is the unchanged context line shared with the added version.
143- #define GPUCA_KRNL_CALL_multi (x_class, x_attributes, x_arguments, x_forward ) \
144- if (start == nullptr ) { \
145- hipLaunchKernelGGL (HIP_KERNEL_NAME (GPUCA_M_CAT3 (krnl_, GPUCA_M_KRNL_NAME (x_class), _multi)), dim3 (x.nBlocks ), dim3 (x.nThreads ), 0 , me->mInternals ->Streams [x.stream ], GPUCA_CONSMEM_CALL y.start , y.num , args...); \
146- } else { \
147- hipExtLaunchKernelGGL (HIP_KERNEL_NAME (GPUCA_M_CAT3 (krnl_, GPUCA_M_KRNL_NAME (x_class), _multi)), dim3 (x.nBlocks ), dim3 (x.nThreads ), 0 , me->mInternals ->Streams [x.stream ], *start , *stop , 0 , GPUCA_CONSMEM_CALL y.start , y.num , args...); \
// Added by this change: launch the kernel whose symbol is krnl_ joined with GPUCA_M_KRNL_NAME(x_class).
// Launch configuration: x.nBlocks blocks of x.nThreads threads, 0 as the shared-memory argument,
// on stream me->mInternals->Streams[x.stream].
//  - debugStartEvent == nullptr: plain hipLaunchKernelGGL.
//  - otherwise: hipExtLaunchKernelGGL, additionally passing *debugStartEvent, *debugStopEvent and flags 0.
// Kernel arguments: GPUCA_CONSMEM_CALL (defined elsewhere), then y.start, then the forwarded args pack.
// Only x_class is used in the body; x_attributes, x_arguments and x_forward are accepted but unused here.
// x, y, me, args, debugStartEvent and debugStopEvent are not macro parameters and must exist in the
// scope where the macro is expanded.
// NOTE(review): only debugStartEvent is null-checked; debugStopEvent is dereferenced unconditionally
// in the else-branch, so callers must pass both or neither.
137+ #define GPUCA_KRNL_CALL_single (x_class, x_attributes, x_arguments, x_forward ) \
138+ if (debugStartEvent == nullptr ) { \
139+ hipLaunchKernelGGL (HIP_KERNEL_NAME (GPUCA_M_CAT (krnl_, GPUCA_M_KRNL_NAME (x_class))), dim3 (x.nBlocks ), dim3 (x.nThreads ), 0 , me->mInternals ->Streams [x.stream ], GPUCA_CONSMEM_CALL y.start , args...); \
140+ } else { \
141+ hipExtLaunchKernelGGL (HIP_KERNEL_NAME (GPUCA_M_CAT (krnl_, GPUCA_M_KRNL_NAME (x_class))), dim3 (x.nBlocks ), dim3 (x.nThreads ), 0 , me->mInternals ->Streams [x.stream ], *debugStartEvent , *debugStopEvent , 0 , GPUCA_CONSMEM_CALL y.start , args...); \
142+ }
// Added by this change: multi variant of the kernel launch. The kernel symbol is krnl_ joined with
// GPUCA_M_KRNL_NAME(x_class) and the suffix _multi (via GPUCA_M_CAT3), and y.num is passed as an
// extra kernel argument right after y.start.
// Launch configuration: x.nBlocks blocks of x.nThreads threads, 0 as the shared-memory argument,
// on stream me->mInternals->Streams[x.stream].
//  - debugStartEvent == nullptr: plain hipLaunchKernelGGL.
//  - otherwise: hipExtLaunchKernelGGL, additionally passing *debugStartEvent, *debugStopEvent and flags 0.
// Only x_class is used in the body; x, y, me, args and the two event pointers must exist in the
// scope where the macro is expanded.
// NOTE(review): only debugStartEvent is null-checked; debugStopEvent is dereferenced unconditionally
// in the else-branch, so callers must pass both or neither.
143+ #define GPUCA_KRNL_CALL_multi (x_class, x_attributes, x_arguments, x_forward ) \
144+ if (debugStartEvent == nullptr ) { \
145+ hipLaunchKernelGGL (HIP_KERNEL_NAME (GPUCA_M_CAT3 (krnl_, GPUCA_M_KRNL_NAME (x_class), _multi)), dim3 (x.nBlocks ), dim3 (x.nThreads ), 0 , me->mInternals ->Streams [x.stream ], GPUCA_CONSMEM_CALL y.start , y.num , args...); \
146+ } else { \
147+ hipExtLaunchKernelGGL (HIP_KERNEL_NAME (GPUCA_M_CAT3 (krnl_, GPUCA_M_KRNL_NAME (x_class), _multi)), dim3 (x.nBlocks ), dim3 (x.nThreads ), 0 , me->mInternals ->Streams [x.stream ], *debugStartEvent , *debugStopEvent , 0 , GPUCA_CONSMEM_CALL y.start , y.num , args...); \
148148 }
149149#include " GPUReconstructionKernels.h"
150150#undef GPUCA_KRNL
0 commit comments