@@ -333,3 +333,38 @@ entry:
333333 store double %call1 , double addrspace (1 )* %arrayidx2 , align 8
334334 ret void
335335}
336+
; si64tofp_kernel: signed i64 -> double conversion case.
;
; The kernel reads one i64 from %inA, converts it with `sitofp`, and writes the
; resulting double to %out at the same element index. The expectations inside
; the function require that, after the pass under test has run, the conversion
; is performed by a call to @__igcbuiltin_int64_to_dp taking the loaded value,
; the constant i32 0, and a pointer to an i32 alloca, and that the surrounding
; index computation, load and store are otherwise intact.
;
; The expectations match in order and spell out operand order, so the
; instruction sequence and operand positions below must not be rearranged.
; Local value names are free: every one is captured with a regex.
; NOTE(review): the RUN line and attribute group #0 are outside this excerpt.
define spir_kernel void @si64tofp_kernel(i64 addrspace(1)* %inA, double addrspace(1)* %out, <8 x i32> %r0, <8 x i32> %payloadHeader, <3 x i32> %enqueuedLocalSize, i16 %localIdX, i16 %localIdY, i16 %localIdZ, i8* %privateBase, i32 %bufferOffset, i32 %bufferOffset1, i32 %bindlessOffset, i32 %bindlessOffset2) #0 {
; CHECK-LABEL: @si64tofp_kernel(
; CHECK: entry:
; CHECK: [[DPEmuFlag:%.*]] = alloca i32
; CHECK: [[TMP0:%.*]] = extractelement <8 x i32> %payloadHeader, i64 0
; CHECK: [[TMP1:%.*]] = extractelement <3 x i32> %enqueuedLocalSize, i64 0
; CHECK: [[TMP2:%.*]] = extractelement <8 x i32> %r0, i64 1
; CHECK: [[MUL:%.*]] = mul i32 [[TMP1]], [[TMP2]]
; CHECK: [[LOCAL_ID_X:%.*]] = zext i16 %localIdX to i32
; CHECK: [[ADD0:%.*]] = add i32 [[MUL]], [[LOCAL_ID_X]]
; CHECK: [[ADD1:%.*]] = add i32 [[ADD0]], [[TMP0]]
; CHECK: [[CONV0:%.*]] = zext i32 [[ADD1]] to i64
; CHECK: [[ARRAY_IDX0:%.*]] = getelementptr inbounds i64, i64 addrspace(1)* %inA, i64 [[CONV0]]
; CHECK: [[TMP3:%.*]] = load i64, i64 addrspace(1)* [[ARRAY_IDX0]], align 8
; CHECK: [[CALL_TMP:%.*]] = call double @__igcbuiltin_int64_to_dp(i64 [[TMP3]], i32 0, i32* [[DPEmuFlag]])
; CHECK: [[ARRAY_IDX1:%.*]] = getelementptr inbounds double, double addrspace(1)* %out, i64 [[CONV0]]
; CHECK: store double [[CALL_TMP]], double addrspace(1)* [[ARRAY_IDX1]], align 8
; CHECK: ret void
entry:
  ; Pull the three scalar inputs of the index out of the implicit vector arguments.
  %hdr.e0 = extractelement <8 x i32> %payloadHeader, i64 0
  %els.e0 = extractelement <3 x i32> %enqueuedLocalSize, i64 0
  %r0.e1 = extractelement <8 x i32> %r0, i64 1

  ; index = enqueuedLocalSize[0] * r0[1] + zext(localIdX) + payloadHeader[0]
  ; (presumably the work-item's global X id; not established by this file)
  %prod = mul i32 %els.e0, %r0.e1
  %lidx.wide = zext i16 %localIdX to i32
  %partial = add i32 %prod, %lidx.wide
  %flat32 = add i32 %partial, %hdr.e0
  %flat64 = zext i32 %flat32 to i64

  ; Load the signed 64-bit source element.
  %in.addr = getelementptr inbounds i64, i64 addrspace(1)* %inA, i64 %flat64
  %in.val = load i64, i64 addrspace(1)* %in.addr, align 8

  ; The instruction under test: signed i64 -> double.
  %as.fp = sitofp i64 %in.val to double

  ; Store the converted value at the same element index of the output buffer.
  %out.addr = getelementptr inbounds double, double addrspace(1)* %out, i64 %flat64
  store double %as.fp, double addrspace(1)* %out.addr, align 8
  ret void
}
0 commit comments