@@ -52,12 +52,6 @@ ur_result_t setupContext(ur_context_handle_t Context, uint32_t numDevices,
52
52
return UR_RESULT_SUCCESS;
53
53
}
54
54
55
- bool isInstrumentedKernel (ur_kernel_handle_t hKernel) {
56
- auto hProgram = GetProgram (hKernel);
57
- auto PI = getAsanInterceptor ()->getProgramInfo (hProgram);
58
- return PI->isKernelInstrumented (hKernel);
59
- }
60
-
61
55
} // namespace
62
56
63
57
// /////////////////////////////////////////////////////////////////////////////
@@ -465,12 +459,6 @@ __urdlllocal ur_result_t UR_APICALL urEnqueueKernelLaunch(
465
459
466
460
getContext ()->logger .debug (" ==== urEnqueueKernelLaunch" );
467
461
468
- if (!isInstrumentedKernel (hKernel)) {
469
- return pfnKernelLaunch (hQueue, hKernel, workDim, pGlobalWorkOffset,
470
- pGlobalWorkSize, pLocalWorkSize,
471
- numEventsInWaitList, phEventWaitList, phEvent);
472
- }
473
-
474
462
USMLaunchInfo LaunchInfo (GetContext (hKernel), GetDevice (hQueue),
475
463
pGlobalWorkSize, pLocalWorkSize, pGlobalWorkOffset,
476
464
workDim);
@@ -1362,9 +1350,7 @@ __urdlllocal ur_result_t UR_APICALL urKernelCreate(
1362
1350
getContext ()->logger .debug (" ==== urKernelCreate" );
1363
1351
1364
1352
UR_CALL (pfnCreate (hProgram, pKernelName, phKernel));
1365
- if (isInstrumentedKernel (*phKernel)) {
1366
- UR_CALL (getAsanInterceptor ()->insertKernel (*phKernel));
1367
- }
1353
+ UR_CALL (getAsanInterceptor ()->insertKernel (*phKernel));
1368
1354
1369
1355
return UR_RESULT_SUCCESS;
1370
1356
}
@@ -1385,9 +1371,7 @@ __urdlllocal ur_result_t UR_APICALL urKernelRetain(
1385
1371
UR_CALL (pfnRetain (hKernel));
1386
1372
1387
1373
auto KernelInfo = getAsanInterceptor ()->getKernelInfo (hKernel);
1388
- if (KernelInfo) {
1389
- KernelInfo->RefCount ++;
1390
- }
1374
+ KernelInfo->RefCount ++;
1391
1375
1392
1376
return UR_RESULT_SUCCESS;
1393
1377
}
@@ -1407,10 +1391,8 @@ __urdlllocal ur_result_t urKernelRelease(
1407
1391
UR_CALL (pfnRelease (hKernel));
1408
1392
1409
1393
auto KernelInfo = getAsanInterceptor ()->getKernelInfo (hKernel);
1410
- if (KernelInfo) {
1411
- if (--KernelInfo->RefCount == 0 ) {
1412
- UR_CALL (getAsanInterceptor ()->eraseKernel (hKernel));
1413
- }
1394
+ if (--KernelInfo->RefCount == 0 ) {
1395
+ UR_CALL (getAsanInterceptor ()->eraseKernel (hKernel));
1414
1396
}
1415
1397
1416
1398
return UR_RESULT_SUCCESS;
@@ -1439,8 +1421,8 @@ __urdlllocal ur_result_t UR_APICALL urKernelSetArgValue(
1439
1421
std::shared_ptr<KernelInfo> KernelInfo;
1440
1422
if (argSize == sizeof (ur_mem_handle_t ) &&
1441
1423
(MemBuffer = getAsanInterceptor ()->getMemBuffer (
1442
- *ur_cast<const ur_mem_handle_t *>(pArgValue))) &&
1443
- ( KernelInfo = getAsanInterceptor ()->getKernelInfo (hKernel))) {
1424
+ *ur_cast<const ur_mem_handle_t *>(pArgValue)))) {
1425
+ auto KernelInfo = getAsanInterceptor ()->getKernelInfo (hKernel);
1444
1426
std::scoped_lock<ur_shared_mutex> Guard (KernelInfo->Mutex );
1445
1427
KernelInfo->BufferArgs [argIndex] = std::move (MemBuffer);
1446
1428
} else {
@@ -1470,8 +1452,8 @@ __urdlllocal ur_result_t UR_APICALL urKernelSetArgMemObj(
1470
1452
1471
1453
std::shared_ptr<MemBuffer> MemBuffer;
1472
1454
std::shared_ptr<KernelInfo> KernelInfo;
1473
- if ((MemBuffer = getAsanInterceptor ()->getMemBuffer (hArgValue)) &&
1474
- ( KernelInfo = getAsanInterceptor ()->getKernelInfo (hKernel))) {
1455
+ if ((MemBuffer = getAsanInterceptor ()->getMemBuffer (hArgValue))) {
1456
+ auto KernelInfo = getAsanInterceptor ()->getKernelInfo (hKernel);
1475
1457
std::scoped_lock<ur_shared_mutex> Guard (KernelInfo->Mutex );
1476
1458
KernelInfo->BufferArgs [argIndex] = std::move (MemBuffer);
1477
1459
} else {
@@ -1501,7 +1483,8 @@ __urdlllocal ur_result_t UR_APICALL urKernelSetArgLocal(
1501
1483
" ==== urKernelSetArgLocal (argIndex={}, argSize={})" , argIndex,
1502
1484
argSize);
1503
1485
1504
- if (auto KI = getAsanInterceptor ()->getKernelInfo (hKernel)) {
1486
+ {
1487
+ auto KI = getAsanInterceptor ()->getKernelInfo (hKernel);
1505
1488
std::scoped_lock<ur_shared_mutex> Guard (KI->Mutex );
1506
1489
// TODO: get local variable alignment
1507
1490
auto argSizeWithRZ = GetSizeAndRedzoneSizeForLocal (
@@ -1538,8 +1521,8 @@ __urdlllocal ur_result_t UR_APICALL urKernelSetArgPointer(
1538
1521
pArgValue);
1539
1522
1540
1523
std::shared_ptr<KernelInfo> KI;
1541
- if (getAsanInterceptor ()->getOptions ().DetectKernelArguments &&
1542
- ( KI = getAsanInterceptor ()->getKernelInfo (hKernel))) {
1524
+ if (getAsanInterceptor ()->getOptions ().DetectKernelArguments ) {
1525
+ auto KI = getAsanInterceptor ()->getKernelInfo (hKernel);
1543
1526
std::scoped_lock<ur_shared_mutex> Guard (KI->Mutex );
1544
1527
KI->PointerArgs [argIndex] = {pArgValue, GetCurrentBacktrace ()};
1545
1528
}
0 commit comments