|
|
|
@ -185,8 +185,13 @@ void CUPTIAPI bufferCompleted(CUcontext ctx, uint32_t streamId, uint8_t *buffer,
|
|
|
|
|
switch (record->kind) {
|
|
|
|
|
case CUPTI_ACTIVITY_KIND_KERNEL:
|
|
|
|
|
case CUPTI_ACTIVITY_KIND_CONCURRENT_KERNEL: {
|
|
|
|
|
#if CUDA_VERSION >= 9000
|
|
|
|
|
auto *kernel =
|
|
|
|
|
reinterpret_cast<const CUpti_ActivityKernel4 *>(record);
|
|
|
|
|
#else
|
|
|
|
|
auto *kernel =
|
|
|
|
|
reinterpret_cast<const CUpti_ActivityKernel3 *>(record);
|
|
|
|
|
#endif
|
|
|
|
|
tracer->AddKernelRecords(kernel->name, kernel->start, kernel->end,
|
|
|
|
|
kernel->deviceId, kernel->streamId,
|
|
|
|
|
kernel->correlationId);
|
|
|
|
|