@@ -333,3 +333,38 @@ entry:
333
333
store double %call1 , double addrspace (1 )* %arrayidx2 , align 8
334
334
ret void
335
335
}
336
+
337
; Test kernel for the signed 64-bit integer to double conversion
; (sitofp i64 ... to double).
;
; The input IR below computes an element index as
;   zext(enqueuedLocalSize[0] * r0[1] + zext(localIdX) + payloadHeader[0])
; loads an i64 from %inA at that index, converts it with sitofp, and stores
; the resulting double to %out at the same index.
;
; The FileCheck directives expect, in order after the entry label: an
; alloca i32, the same index computation and load, a call to
; @__igcbuiltin_int64_to_dp taking the loaded value, the constant i32 0 and a
; pointer to that alloca, and finally the store of the call result to %out.
; No sitofp is matched in the expected output.
;
; NOTE(review): the RUN line and the pass under test are outside this view;
; presumably this exercises a double-precision emulation lowering - confirm.
; NOTE(review): the meaning of the i32 0 argument to the builtin is not
; visible here - verify against the builtin's declaration.
+ define spir_kernel void @si64tofp_kernel (i64 addrspace (1 )* %inA , double addrspace (1 )* %out , <8 x i32 > %r0 , <8 x i32 > %payloadHeader , <3 x i32 > %enqueuedLocalSize , i16 %localIdX , i16 %localIdY , i16 %localIdZ , i8* %privateBase , i32 %bufferOffset , i32 %bufferOffset1 , i32 %bindlessOffset , i32 %bindlessOffset2 ) #0 {
338
+ ; CHECK-LABEL: @si64tofp_kernel(
339
+ ; CHECK: entry:
340
+ ; CHECK: [[DPEmuFlag:%.*]] = alloca i32
341
+ ; CHECK: [[TMP0:%.*]] = extractelement <8 x i32> %payloadHeader, i64 0
342
+ ; CHECK: [[TMP1:%.*]] = extractelement <3 x i32> %enqueuedLocalSize, i64 0
343
+ ; CHECK: [[TMP2:%.*]] = extractelement <8 x i32> %r0, i64 1
344
+ ; CHECK: [[MUL:%.*]] = mul i32 [[TMP1]], [[TMP2]]
345
+ ; CHECK: [[LOCAL_ID_X:%.*]] = zext i16 %localIdX to i32
346
+ ; CHECK: [[ADD0:%.*]] = add i32 [[MUL]], [[LOCAL_ID_X]]
347
+ ; CHECK: [[ADD1:%.*]] = add i32 [[ADD0]], [[TMP0]]
348
+ ; CHECK: [[CONV0:%.*]] = zext i32 [[ADD1]] to i64
349
+ ; CHECK: [[ARRAY_IDX0:%.*]] = getelementptr inbounds i64, i64 addrspace(1)* %inA, i64 [[CONV0]]
350
+ ; CHECK: [[TMP3:%.*]] = load i64, i64 addrspace(1)* [[ARRAY_IDX0]], align 8
351
+ ; CHECK: [[CALL_TMP:%.*]] = call double @__igcbuiltin_int64_to_dp(i64 [[TMP3]], i32 0, i32* [[DPEmuFlag]])
352
+ ; CHECK: [[ARRAY_IDX1:%.*]] = getelementptr inbounds double, double addrspace(1)* %out, i64 [[CONV0]]
353
+ ; CHECK: store double [[CALL_TMP]], double addrspace(1)* [[ARRAY_IDX1]], align 8
354
+ ; CHECK: ret void
355
; Input IR starts here; the directives above describe the expected output.
+ entry:
356
+ %payloadHeader.scalar = extractelement <8 x i32 > %payloadHeader , i64 0
357
+ %enqueuedLocalSize.scalar = extractelement <3 x i32 > %enqueuedLocalSize , i64 0
358
+ %r0.scalar19 = extractelement <8 x i32 > %r0 , i64 1
359
+ %0 = mul i32 %enqueuedLocalSize.scalar , %r0.scalar19
360
+ %localIdX4 = zext i16 %localIdX to i32
361
+ %1 = add i32 %0 , %localIdX4
362
+ %2 = add i32 %1 , %payloadHeader.scalar
363
+ %3 = zext i32 %2 to i64
364
+ %arrayidx = getelementptr inbounds i64 , i64 addrspace (1 )* %inA , i64 %3
365
+ %4 = load i64 , i64 addrspace (1 )* %arrayidx , align 8
366
; Conversion under test: the expected output has a builtin call in its place.
+ %call1 = sitofp i64 %4 to double
367
+ %arrayidx2 = getelementptr inbounds double , double addrspace (1 )* %out , i64 %3
368
+ store double %call1 , double addrspace (1 )* %arrayidx2 , align 8
369
+ ret void
370
+ }
0 commit comments