@@ -24,15 +24,13 @@ inline void storeTokenIfNotNull(KernelInfo &kernelInfo, T *token) {
2424 kernelInfo.storePatchToken (token);
2525 }
2626}
27-
// getOffset: returns token->Offset when `token` is non-null; otherwise falls
// through to a sentinel return value.
// NOTE(review): this block is shown in diff form. The '-' line is the removed
// return (WorkloadInfo::undefinedOffset) and the '+' line is its replacement
// (undefined<uint32_t>). Both names are declared outside this view; presumably
// they denote an "offset not present" marker -- confirm against their definitions.
2827template <typename T>
2928inline uint32_t getOffset (T *token) {
3029 if (token != nullptr ) {
3130 return token->Offset ;
3231 }
33- return WorkloadInfo::undefinedOffset ;
32+ return undefined< uint32_t > ;
3433}
35-
3634void populateKernelInfoArgMetadata (KernelInfo &dstKernelInfoArg, const SPatchKernelArgumentInfo *src) {
3735 if (nullptr == src) {
3836 return ;
@@ -158,7 +156,7 @@ void populateKernelInfo(KernelInfo &dst, const PatchTokenBinary::KernelFromPatch
158156
159157 storeTokenIfNotNull (dst, src.tokens .executionEnvironment );
160158 dst.usesSsh = src.tokens .bindingTableState && (src.tokens .bindingTableState ->Count > 0 );
161- dst.workloadInfo . slmStaticSize = src.tokens .allocateLocalSurface ? src.tokens .allocateLocalSurface ->TotalInlineLocalMemorySize : 0U ;
159+ dst.kernelDescriptor . kernelAttributes . slmInlineSize = src.tokens .allocateLocalSurface ? src.tokens .allocateLocalSurface ->TotalInlineLocalMemorySize : 0U ;
162160
163161 dst.kernelArgInfo .resize (src.tokens .kernelArgs .size ());
164162
@@ -178,23 +176,6 @@ void populateKernelInfo(KernelInfo &dst, const PatchTokenBinary::KernelFromPatch
178176 dst.isVmeWorkload = dst.isVmeWorkload || (src.tokens .inlineVmeSamplerInfo != nullptr );
179177 dst.systemKernelOffset = src.tokens .stateSip ? src.tokens .stateSip ->SystemKernelOffset : 0U ;
180178
181- for (uint32_t i = 0 ; i < 3U ; ++i) {
182- dst.workloadInfo .localWorkSizeOffsets [i] = getOffset (src.tokens .crossThreadPayloadArgs .localWorkSize [i]);
183- dst.workloadInfo .localWorkSizeOffsets2 [i] = getOffset (src.tokens .crossThreadPayloadArgs .localWorkSize2 [i]);
184- dst.workloadInfo .globalWorkOffsetOffsets [i] = getOffset (src.tokens .crossThreadPayloadArgs .globalWorkOffset [i]);
185- dst.workloadInfo .enqueuedLocalWorkSizeOffsets [i] = getOffset (src.tokens .crossThreadPayloadArgs .enqueuedLocalWorkSize [i]);
186- dst.workloadInfo .globalWorkSizeOffsets [i] = getOffset (src.tokens .crossThreadPayloadArgs .globalWorkSize [i]);
187- dst.workloadInfo .numWorkGroupsOffset [i] = getOffset (src.tokens .crossThreadPayloadArgs .numWorkGroups [i]);
188- }
189-
190- dst.workloadInfo .maxWorkGroupSizeOffset = getOffset (src.tokens .crossThreadPayloadArgs .maxWorkGroupSize );
191- dst.workloadInfo .workDimOffset = getOffset (src.tokens .crossThreadPayloadArgs .workDimensions );
192- dst.workloadInfo .simdSizeOffset = getOffset (src.tokens .crossThreadPayloadArgs .simdSize );
193- dst.workloadInfo .parentEventOffset = getOffset (src.tokens .crossThreadPayloadArgs .parentEvent );
194- dst.workloadInfo .preferredWkgMultipleOffset = getOffset (src.tokens .crossThreadPayloadArgs .preferredWorkgroupMultiple );
195- dst.workloadInfo .privateMemoryStatelessSizeOffset = getOffset (src.tokens .crossThreadPayloadArgs .privateMemoryStatelessSize );
196- dst.workloadInfo .localMemoryStatelessWindowSizeOffset = getOffset (src.tokens .crossThreadPayloadArgs .localMemoryStatelessWindowSize );
197- dst.workloadInfo .localMemoryStatelessWindowStartAddressOffset = getOffset (src.tokens .crossThreadPayloadArgs .localMemoryStatelessWindowStartAddress );
198179 for (auto &childSimdSize : src.tokens .crossThreadPayloadArgs .childBlockSimdSize ) {
199180 dst.childrenKernelsIdOffset .push_back ({childSimdSize->ArgumentNumber , childSimdSize->Offset });
200181 }
0 commit comments