@@ -1988,7 +1988,7 @@ std::string instrumentationGetKernelName(
19881988void instrumentationAddExtraKernelMetadata (
19891989 xpti_td *&CmdTraceEvent, const NDRDescT &NDRDesc,
19901990 detail::kernel_bundle_impl *KernelBundleImplPtr,
1991- KernelNameStrRefT KernelName, KernelNameBasedData *KernelNameBasedDataPtr ,
1991+ KernelNameStrRefT KernelName, KernelNameBasedData &KernelNameBasedData ,
19921992 const std::shared_ptr<detail::kernel_impl> &SyclKernel, queue_impl *Queue,
19931993 std::vector<ArgDesc> &CGArgs) // CGArgs are not const since they could be
19941994 // sorted in this function
@@ -2012,11 +2012,10 @@ void instrumentationAddExtraKernelMetadata(
20122012 // NOTE: Queue can be null when a kernel is enqueued directly to a
20132013 // command buffer by the graph API, when a modifiable graph is
20142014 // finalized.
2015- assert (KernelNameBasedDataPtr);
20162015 FastKernelCacheValPtr FastKernelCacheVal =
20172016 detail::ProgramManager::getInstance ().getOrCreateKernel (
20182017 Queue->getContextImpl (), Queue->getDeviceImpl (), KernelName,
2019- *KernelNameBasedDataPtr );
2018+ KernelNameBasedData );
20202019 EliminatedArgMask = FastKernelCacheVal->MKernelArgMask ;
20212020 }
20222021
@@ -2104,7 +2103,7 @@ std::pair<xpti_td *, uint64_t> emitKernelInstrumentationData(
21042103 const std::shared_ptr<detail::kernel_impl> &SyclKernel,
21052104 const detail::code_location &CodeLoc, bool IsTopCodeLoc,
21062105 const std::string_view SyclKernelName,
2107- KernelNameBasedData *KernelNameBasedDataPtr , queue_impl *Queue,
2106+ KernelNameBasedData &KernelNameBasedData , queue_impl *Queue,
21082107 const NDRDescT &NDRDesc, detail::kernel_bundle_impl *KernelBundleImplPtr,
21092108 std::vector<ArgDesc> &CGArgs) {
21102109
@@ -2143,7 +2142,7 @@ std::pair<xpti_td *, uint64_t> emitKernelInstrumentationData(
21432142 getQueueID (Queue));
21442143 instrumentationAddExtraKernelMetadata (
21452144 CmdTraceEvent, NDRDesc, KernelBundleImplPtr,
2146- std::string (SyclKernelName), KernelNameBasedDataPtr , SyclKernel, Queue,
2145+ std::string (SyclKernelName), KernelNameBasedData , SyclKernel, Queue,
21472146 CGArgs);
21482147
21492148 xptiNotifySubscribers (
@@ -2199,7 +2198,7 @@ void ExecCGCommand::emitInstrumentationData() {
21992198 reinterpret_cast <detail::CGExecKernel *>(MCommandGroup.get ());
22002199 instrumentationAddExtraKernelMetadata (
22012200 CmdTraceEvent, KernelCG->MNDRDesc , KernelCG->getKernelBundle ().get (),
2202- KernelCG->MKernelName , KernelCG->MKernelNameBasedDataPtr ,
2201+ KernelCG->MKernelName , KernelCG->MKernelNameBasedData ,
22032202 KernelCG->MSyclKernel , MQueue.get (), KernelCG->MArgs );
22042203 }
22052204
@@ -2401,7 +2400,7 @@ static ur_result_t SetKernelParamsAndLaunch(
24012400 const std::function<void *(Requirement *Req)> &getMemAllocationFunc,
24022401 bool IsCooperative, bool KernelUsesClusterLaunch,
24032402 uint32_t WorkGroupMemorySize, const RTDeviceBinaryImage *BinImage,
2404- KernelNameStrRefT KernelName, KernelNameBasedData *KernelNameBasedDataPtr ,
2403+ KernelNameStrRefT KernelName, KernelNameBasedData &KernelNameBasedData ,
24052404 void *KernelFuncPtr = nullptr, int KernelNumArgs = 0,
24062405 detail::kernel_param_desc_t (*KernelParamDescGetter)(int ) = nullptr,
24072406 bool KernelHasSpecialCaptures = true) {
@@ -2448,7 +2447,7 @@ static ur_result_t SetKernelParamsAndLaunch(
24482447 }
24492448
24502449 const std::optional<int > &ImplicitLocalArg =
2451- KernelNameBasedDataPtr-> getImplicitLocalArgPos ();
2450+ KernelNameBasedData. getImplicitLocalArgPos ();
24522451 // Set the implicit local memory buffer to support
24532452 // get_work_group_scratch_memory. This is for backend not supporting
24542453 // CUDA-style local memory setting. Note that we may have -1 as a position,
@@ -2549,11 +2548,10 @@ getCGKernelInfo(const CGExecKernel &CommandGroup, context_impl &ContextImpl,
25492548 DeviceImageImpl = &SyclKernelImpl->getDeviceImage ();
25502549 EliminatedArgMask = SyclKernelImpl->getKernelArgMask ();
25512550 } else {
2552- assert (CommandGroup.MKernelNameBasedDataPtr );
25532551 FastKernelCacheValPtr FastKernelCacheVal =
25542552 sycl::detail::ProgramManager::getInstance ().getOrCreateKernel (
25552553 ContextImpl, DeviceImpl, CommandGroup.MKernelName ,
2556- * CommandGroup.MKernelNameBasedDataPtr );
2554+ CommandGroup.MKernelNameBasedData );
25572555 UrKernel = FastKernelCacheVal->MKernelHandle ;
25582556 EliminatedArgMask = FastKernelCacheVal->MKernelArgMask ;
25592557 // To keep UrKernel valid, we return FastKernelCacheValPtr.
@@ -2668,7 +2666,7 @@ void enqueueImpKernel(
26682666 queue_impl &Queue, NDRDescT &NDRDesc, std::vector<ArgDesc> &Args,
26692667 detail::kernel_bundle_impl *KernelBundleImplPtr,
26702668 const detail::kernel_impl *MSyclKernel, KernelNameStrRefT KernelName,
2671- KernelNameBasedData *KernelNameBasedDataPtr ,
2669+ KernelNameBasedData &KernelNameBasedData ,
26722670 std::vector<ur_event_handle_t > &RawEvents, detail::event_impl *OutEventImpl,
26732671 const std::function<void *(Requirement *Req)> &getMemAllocationFunc,
26742672 ur_kernel_cache_config_t KernelCacheConfig, const bool KernelIsCooperative,
@@ -2714,9 +2712,8 @@ void enqueueImpKernel(
27142712 EliminatedArgMask = SyclKernelImpl->getKernelArgMask ();
27152713 KernelMutex = SyclKernelImpl->getCacheMutex ();
27162714 } else {
2717- assert (KernelNameBasedDataPtr);
27182715 KernelCacheVal = detail::ProgramManager::getInstance ().getOrCreateKernel (
2719- ContextImpl, DeviceImpl, KernelName, *KernelNameBasedDataPtr , NDRDesc);
2716+ ContextImpl, DeviceImpl, KernelName, KernelNameBasedData , NDRDesc);
27202717 Kernel = KernelCacheVal->MKernelHandle ;
27212718 KernelMutex = KernelCacheVal->MMutex ;
27222719 Program = KernelCacheVal->MProgramHandle ;
@@ -2763,8 +2760,8 @@ void enqueueImpKernel(
27632760 Queue, Args, DeviceImageImpl, Kernel, NDRDesc, EventsWaitList,
27642761 OutEventImpl, EliminatedArgMask, getMemAllocationFunc,
27652762 KernelIsCooperative, KernelUsesClusterLaunch, WorkGroupMemorySize,
2766- BinImage, KernelName, KernelNameBasedDataPtr , KernelFuncPtr,
2767- KernelNumArgs, KernelParamDescGetter, KernelHasSpecialCaptures);
2763+ BinImage, KernelName, KernelNameBasedData , KernelFuncPtr, KernelNumArgs ,
2764+ KernelParamDescGetter, KernelHasSpecialCaptures);
27682765 }
27692766 if (UR_RESULT_SUCCESS != Error) {
27702767 // If we have got non-success error code, let's analyze it to emit nice
@@ -3243,7 +3240,7 @@ ur_result_t ExecCGCommand::enqueueImpQueue() {
32433240 if (!EventImpl) {
32443241 // Kernel only uses assert if it's non interop one
32453242 bool KernelUsesAssert = (!SyclKernel || SyclKernel->hasSYCLMetadata ()) &&
3246- ExecKernel->MKernelNameBasedDataPtr -> usesAssert ();
3243+ ExecKernel->MKernelNameBasedData . usesAssert ();
32473244 if (KernelUsesAssert) {
32483245 EventImpl = MEvent.get ();
32493246 }
@@ -3256,7 +3253,7 @@ ur_result_t ExecCGCommand::enqueueImpQueue() {
32563253 }
32573254 enqueueImpKernel (
32583255 *MQueue, NDRDesc, Args, ExecKernel->getKernelBundle ().get (),
3259- SyclKernel.get (), KernelName, ExecKernel->MKernelNameBasedDataPtr ,
3256+ SyclKernel.get (), KernelName, ExecKernel->MKernelNameBasedData ,
32603257 RawEvents, EventImpl, getMemAllocationFunc,
32613258 ExecKernel->MKernelCacheConfig , ExecKernel->MKernelIsCooperative ,
32623259 ExecKernel->MKernelUsesClusterLaunch ,
0 commit comments