blob: 77ed1d6fecf9ae11cc0cb792ee89cc2c2e555161 [file] [log] [blame]
; This is an excerpt from the SYCL end-to-end test suite, cleaned out from unrelevant details,
; that reproduced multiple cases of the issues when OpPhi's result type mismatches with operand types.
; The only pass criterion is that spirv-val considers output valid.
; RUN: %if spirv-tools %{ llc -O0 -mtriple=spirv64-unknown-unknown %s -o - -filetype=obj | spirv-val %}
%struct.PFWGFunctor = type { i64, i64, i32, i32, %"class.sycl::_V1::accessor" }
%"class.sycl::_V1::accessor" = type { %"class.sycl::_V1::detail::AccessorImplDevice", %union.anon }
%"class.sycl::_V1::detail::AccessorImplDevice" = type { %"class.sycl::_V1::range", %"class.sycl::_V1::range", %"class.sycl::_V1::range" }
%"class.sycl::_V1::range" = type { %"class.sycl::_V1::detail::array" }
%"class.sycl::_V1::detail::array" = type { [1 x i64] }
%union.anon = type { ptr addrspace(1) }
%class.anon.2 = type { %"class.sycl::_V1::accessor" }
%"class.sycl::_V1::group" = type { %"class.sycl::_V1::range", %"class.sycl::_V1::range", %"class.sycl::_V1::range", %"class.sycl::_V1::range" }
%"class.sycl::_V1::group.15" = type { %"class.sycl::_V1::range.16", %"class.sycl::_V1::range.16", %"class.sycl::_V1::range.16", %"class.sycl::_V1::range.16" }
%"class.sycl::_V1::range.16" = type { %"class.sycl::_V1::detail::array.17" }
%"class.sycl::_V1::detail::array.17" = type { [2 x i64] }
%"class.sycl::_V1::private_memory" = type { %struct.MyStruct }
%struct.MyStruct = type { i32, i32 }
@GFunctor = internal addrspace(3) global %struct.PFWGFunctor undef, align 8
@WI.0 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WI.1 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WI.2 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WI.3 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WI.4 = internal unnamed_addr addrspace(3) global i32 undef, align 8
@WI.6 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@GCnt = internal unnamed_addr addrspace(3) global i32 undef, align 4
@__spirv_BuiltInNumWorkgroups = external dso_local local_unnamed_addr addrspace(1) constant <3 x i64>, align 32
@GKernel1 = internal addrspace(3) global %class.anon.2 undef, align 8
@GCnt2 = internal unnamed_addr addrspace(3) global i32 undef, align 4
@GKernel2 = internal addrspace(3) global %class.anon.2 undef, align 8
@GCnt3 = internal unnamed_addr addrspace(3) global i32 undef, align 4
@GKernel3 = internal addrspace(3) global %class.anon.2 undef, align 8
@GCnt4 = internal unnamed_addr addrspace(3) global i32 undef, align 4
@GKernel4 = internal addrspace(3) global %class.anon.2 undef, align 8
@GCnt5 = internal unnamed_addr addrspace(3) global i32 undef, align 4
@__spirv_BuiltInLocalInvocationIndex = external local_unnamed_addr addrspace(1) constant i64, align 8
@GThis = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@GAsCast = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@GCmp = internal unnamed_addr addrspace(3) global i1 undef, align 1
@WGCopy = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@WGCopy.1.0 = internal unnamed_addr addrspace(3) global i64 undef, align 16
@WGCopy.1.1 = internal unnamed_addr addrspace(3) global i64 undef, align 16
@WGCopy.1.2 = internal unnamed_addr addrspace(3) global i64 undef, align 16
@WGCopy.1.3 = internal unnamed_addr addrspace(3) global i64 undef, align 16
@WGCopy.1.4 = internal unnamed_addr addrspace(3) global i32 undef, align 16
@WGCopy.1.5 = internal unnamed_addr addrspace(3) global i32 undef, align 16
@WGCopy.1.6 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 16
@ArgShadow = internal unnamed_addr addrspace(3) global %"class.sycl::_V1::group" undef, align 16
@GAsCast2 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@GCmp2 = internal unnamed_addr addrspace(3) global i1 undef, align 1
@WGCopy.3.0 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WGCopy.4.0 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WGCopy.5.0 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WGCopy.6.0 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@ArgShadow.7 = internal unnamed_addr addrspace(3) global %"class.sycl::_V1::group" undef, align 16
@GAscast3 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@GCmp3 = internal unnamed_addr addrspace(3) global i1 undef, align 1
@WGCopy.9.0 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WGCopy.10.0 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@ArgShadow.11 = internal unnamed_addr addrspace(3) global %"class.sycl::_V1::group" undef, align 16
@GAsCast4 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@GCmp4 = internal unnamed_addr addrspace(3) global i1 undef, align 1
@WGCopy.13.0 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WGCopy.13.1 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WGCopy.14.0 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@WGCopy.14.1 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@WGCopy.15.0 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WGCopy.15.1 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WGCopy.16.0 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@WGCopy.16.1 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@ArgShadow.17 = internal unnamed_addr addrspace(3) global %"class.sycl::_V1::group.15" undef, align 16
@GAsCast5 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@GCmp5 = internal unnamed_addr addrspace(3) global i1 undef, align 1
@WGCopy.19.0 = internal unnamed_addr addrspace(3) global i64 undef, align 8
@WGCopy.20.0 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@WGCopy.20.1 = internal unnamed_addr addrspace(3) global ptr addrspace(4) undef, align 8
@ArgShadow.21 = internal unnamed_addr addrspace(3) global %"class.sycl::_V1::group" undef, align 16
@__spirv_BuiltInGlobalInvocationId = external dso_local local_unnamed_addr addrspace(1) constant <3 x i64>, align 32
@__spirv_BuiltInGlobalSize = external dso_local local_unnamed_addr addrspace(1) constant <3 x i64>, align 32
@__spirv_BuiltInLocalInvocationId = external dso_local local_unnamed_addr addrspace(1) constant <3 x i64>, align 32
@__spirv_BuiltInWorkgroupId = external dso_local local_unnamed_addr addrspace(1) constant <3 x i64>, align 32
@__spirv_BuiltInWorkgroupSize = external dso_local local_unnamed_addr addrspace(1) constant <3 x i64>, align 32
; Function Attrs: convergent mustprogress norecurse nounwind
define weak_odr dso_local spir_kernel void @_ZTS11PFWGFunctor(i64 noundef %_arg_wg_chunk, i64 noundef %_arg_range_length, i32 noundef %_arg_n_iter, i32 noundef %_arg_addend, ptr addrspace(1) noundef align 4 %_arg_dev_ptr, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr1, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr2, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr3) {
entry:
%agg.tmp67 = alloca %"class.sycl::_V1::group", align 8
store i64 %_arg_wg_chunk, ptr addrspace(3) @GFunctor, align 8
store i64 %_arg_range_length, ptr addrspace(3) undef, align 8
store i32 %_arg_n_iter, ptr addrspace(3) undef, align 8
store i32 %_arg_addend, ptr addrspace(3) undef, align 4
%0 = load i64, ptr %_arg_dev_ptr1, align 8
%1 = load i64, ptr %_arg_dev_ptr2, align 8
%2 = load i64, ptr %_arg_dev_ptr3, align 8
store i64 %2, ptr addrspace(3) undef, align 8
store i64 %0, ptr addrspace(3) undef, align 8
store i64 %1, ptr addrspace(3) undef, align 8
%add.ptr.i = getelementptr inbounds i32, ptr addrspace(1) %_arg_dev_ptr, i64 %2
store ptr addrspace(1) %add.ptr.i, ptr addrspace(3) undef, align 8
%3 = load i64, ptr addrspace(1) @__spirv_BuiltInGlobalSize, align 32
%4 = load i64, ptr addrspace(1) @__spirv_BuiltInWorkgroupSize, align 32
%5 = load i64, ptr addrspace(1) @__spirv_BuiltInNumWorkgroups, align 32
%6 = load i64, ptr addrspace(1) @__spirv_BuiltInWorkgroupId, align 32
call void @llvm.lifetime.start.p0(i64 32, ptr nonnull %agg.tmp67)
store i64 %3, ptr %agg.tmp67, align 1
%agg.tmp6.sroa.2.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 8
store i64 %4, ptr %agg.tmp6.sroa.2.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.3.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 16
store i64 %5, ptr %agg.tmp6.sroa.3.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.4.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 24
store i64 %6, ptr %agg.tmp6.sroa.4.0.agg.tmp67.sroa_idx, align 1
%7 = load i64, ptr addrspace(1) @__spirv_BuiltInLocalInvocationIndex, align 8
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%cmpz15.i = icmp eq i64 %7, 0
br i1 %cmpz15.i, label %leader.i, label %merge.i
leader.i: ; preds = %entry
call void @llvm.memcpy.p3.p0.i64(ptr addrspace(3) noundef align 16 dereferenceable(32) @ArgShadow, ptr noundef nonnull align 8 dereferenceable(32) %agg.tmp67, i64 32, i1 false)
br label %merge.i
merge.i: ; preds = %leader.i, %entry
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call void @llvm.memcpy.p0.p3.i64(ptr noundef nonnull align 8 dereferenceable(32) %agg.tmp67, ptr addrspace(3) noundef align 16 dereferenceable(32) @ArgShadow, i64 32, i1 false)
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz15.i, label %wg_leader.i, label %wg_cf.i
wg_leader.i: ; preds = %merge.i
%g.ascast.i = addrspacecast ptr %agg.tmp67 to ptr addrspace(4)
store ptr addrspace(4) %g.ascast.i, ptr addrspace(3) @GAsCast, align 8
store ptr addrspace(4) addrspacecast (ptr addrspace(3) @GFunctor to ptr addrspace(4)), ptr addrspace(3) @GThis, align 8
%8 = load i32, ptr addrspace(3) undef, align 4
%9 = load i64, ptr addrspace(3) @GFunctor, align 8
%index.i = getelementptr inbounds i8, ptr %agg.tmp67, i64 24
%10 = load i64, ptr %index.i, align 8
%mul.i = mul i64 %9, %10
%localRange.i = getelementptr inbounds i8, ptr %agg.tmp67, i64 8
%11 = load i64, ptr %localRange.i, align 8
%12 = load i64, ptr addrspace(3) undef, align 8
store i64 %9, ptr addrspace(3) @WI.0, align 8
store i64 %11, ptr addrspace(3) @WI.1, align 8
store i64 %mul.i, ptr addrspace(3) @WI.2, align 8
store i64 %12, ptr addrspace(3) @WI.3, align 8
store i32 %8, ptr addrspace(3) @WI.4, align 8
store ptr addrspace(4) undef, ptr addrspace(3) @WI.6, align 8
store i32 0, ptr addrspace(3) @GCnt, align 4
br label %wg_cf.i
wg_cf.i: ; preds = %wg_leader.i, %merge.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%wg_val_this1.i = load ptr addrspace(4), ptr addrspace(3) @GThis, align 8
%n_iter.i = getelementptr inbounds i8, ptr addrspace(4) %wg_val_this1.i, i64 16
%13 = load i64, ptr addrspace(1) @__spirv_BuiltInLocalInvocationId, align 32
br label %for.cond.i
for.cond.i: ; preds = %wg_cf11.i, %wg_cf.i
%agg.tmp.i.sroa.0.0 = phi i64 [ undef, %wg_cf.i ], [ %agg.tmp.i.sroa.0.0.copyload13, %wg_cf11.i ]
%agg.tmp.i.sroa.6.0 = phi i64 [ undef, %wg_cf.i ], [ %agg.tmp.i.sroa.6.0.copyload15, %wg_cf11.i ]
%agg.tmp.i.sroa.7.0 = phi i64 [ undef, %wg_cf.i ], [ %agg.tmp.i.sroa.7.0.copyload17, %wg_cf11.i ]
%agg.tmp.i.sroa.8.0 = phi i64 [ undef, %wg_cf.i ], [ %agg.tmp.i.sroa.8.0.copyload19, %wg_cf11.i ]
%agg.tmp.i.sroa.9.0 = phi i32 [ undef, %wg_cf.i ], [ %agg.tmp.i.sroa.9.0.copyload21, %wg_cf11.i ]
%agg.tmp.i.sroa.10.0 = phi i32 [ undef, %wg_cf.i ], [ %agg.tmp.i.sroa.10.0.copyload23, %wg_cf11.i ]
%agg.tmp.i.sroa.11.0 = phi ptr addrspace(4) [ undef, %wg_cf.i ], [ %agg.tmp.i.sroa.11.0.copyload25, %wg_cf11.i ]
%this.addr.0.i = phi ptr addrspace(4) [ addrspacecast (ptr addrspace(3) @GFunctor to ptr addrspace(4)), %wg_cf.i ], [ %mat_ld13.i, %wg_cf11.i ]
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz15.i, label %wg_leader4.i, label %wg_cf5.i
wg_leader4.i: ; preds = %for.cond.i
%14 = load i32, ptr addrspace(3) @GCnt, align 4
%15 = load i32, ptr addrspace(4) %n_iter.i, align 8
%cmp.i = icmp slt i32 %14, %15
store i1 %cmp.i, ptr addrspace(3) @GCmp, align 1
br label %wg_cf5.i
wg_cf5.i: ; preds = %wg_leader4.i, %for.cond.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%wg_val_cmp.i = load i1, ptr addrspace(3) @GCmp, align 1
br i1 %wg_val_cmp.i, label %for.body.i, label %_ZNK11PFWGFunctorclEN4sycl3_V15groupILi1EEE.exit
for.body.i: ; preds = %wg_cf5.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz15.i, label %wg_leader7.i, label %wg_cf8.i
wg_leader7.i: ; preds = %for.body.i
%agg.tmp.i.sroa.0.0.copyload = load i64, ptr addrspace(3) @WI.0, align 8
%agg.tmp.i.sroa.6.0.copyload = load i64, ptr addrspace(3) @WI.1, align 8
%agg.tmp.i.sroa.7.0.copyload = load i64, ptr addrspace(3) @WI.2, align 8
%agg.tmp.i.sroa.8.0.copyload = load i64, ptr addrspace(3) @WI.3, align 8
%agg.tmp.i.sroa.9.0.copyload = load i32, ptr addrspace(3) @WI.4, align 8
%agg.tmp.i.sroa.11.0.copyload = load ptr addrspace(4), ptr addrspace(3) @WI.6, align 8
br label %wg_cf8.i
wg_cf8.i: ; preds = %wg_leader7.i, %for.body.i
%agg.tmp.i.sroa.0.1 = phi i64 [ %agg.tmp.i.sroa.0.0.copyload, %wg_leader7.i ], [ %agg.tmp.i.sroa.0.0, %for.body.i ]
%agg.tmp.i.sroa.6.1 = phi i64 [ %agg.tmp.i.sroa.6.0.copyload, %wg_leader7.i ], [ %agg.tmp.i.sroa.6.0, %for.body.i ]
%agg.tmp.i.sroa.7.1 = phi i64 [ %agg.tmp.i.sroa.7.0.copyload, %wg_leader7.i ], [ %agg.tmp.i.sroa.7.0, %for.body.i ]
%agg.tmp.i.sroa.8.1 = phi i64 [ %agg.tmp.i.sroa.8.0.copyload, %wg_leader7.i ], [ %agg.tmp.i.sroa.8.0, %for.body.i ]
%agg.tmp.i.sroa.9.1 = phi i32 [ %agg.tmp.i.sroa.9.0.copyload, %wg_leader7.i ], [ %agg.tmp.i.sroa.9.0, %for.body.i ]
%agg.tmp.i.sroa.11.1 = phi ptr addrspace(4) [ %agg.tmp.i.sroa.11.0.copyload, %wg_leader7.i ], [ %agg.tmp.i.sroa.11.0, %for.body.i ]
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz15.i, label %TestMat.i, label %LeaderMat.i
TestMat.i: ; preds = %wg_cf8.i
store i64 %agg.tmp.i.sroa.0.1, ptr addrspace(3) @WGCopy.1.0, align 16
store i64 %agg.tmp.i.sroa.6.1, ptr addrspace(3) @WGCopy.1.1, align 16
store i64 %agg.tmp.i.sroa.7.1, ptr addrspace(3) @WGCopy.1.2, align 16
store i64 %agg.tmp.i.sroa.8.1, ptr addrspace(3) @WGCopy.1.3, align 16
store i32 %agg.tmp.i.sroa.9.1, ptr addrspace(3) @WGCopy.1.4, align 16
store i32 %agg.tmp.i.sroa.10.0, ptr addrspace(3) @WGCopy.1.5, align 16
store ptr addrspace(4) %agg.tmp.i.sroa.11.1, ptr addrspace(3) @WGCopy.1.6, align 16
store ptr addrspace(4) %this.addr.0.i, ptr addrspace(3) @WGCopy, align 8
br label %LeaderMat.i
LeaderMat.i: ; preds = %TestMat.i, %wg_cf8.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%mat_ld13.i = load ptr addrspace(4), ptr addrspace(3) @WGCopy, align 8
%agg.tmp.i.sroa.0.0.copyload13 = load i64, ptr addrspace(3) @WGCopy.1.0, align 16
%agg.tmp.i.sroa.6.0.copyload15 = load i64, ptr addrspace(3) @WGCopy.1.1, align 16
%agg.tmp.i.sroa.7.0.copyload17 = load i64, ptr addrspace(3) @WGCopy.1.2, align 16
%agg.tmp.i.sroa.8.0.copyload19 = load i64, ptr addrspace(3) @WGCopy.1.3, align 16
%agg.tmp.i.sroa.9.0.copyload21 = load i32, ptr addrspace(3) @WGCopy.1.4, align 16
%agg.tmp.i.sroa.10.0.copyload23 = load i32, ptr addrspace(3) @WGCopy.1.5, align 16
%agg.tmp.i.sroa.11.0.copyload25 = load ptr addrspace(4), ptr addrspace(3) @WGCopy.1.6, align 16
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
%cmp.not.i.i = icmp ult i64 %13, %agg.tmp.i.sroa.0.0.copyload13
br i1 %cmp.not.i.i, label %if.end.i.i, label %lexit1
if.end.i.i: ; preds = %LeaderMat.i
%add.i.i = add i64 %agg.tmp.i.sroa.0.0.copyload13, %agg.tmp.i.sroa.6.0.copyload15
%sub.i.i = add i64 %add.i.i, -1
%div.i.i = udiv i64 %sub.i.i, %agg.tmp.i.sroa.6.0.copyload15
%mul.i.i = mul i64 %13, %div.i.i
%add4.i.i = add i64 %agg.tmp.i.sroa.7.0.copyload17, %mul.i.i
%add6.i.i = add i64 %add4.i.i, %div.i.i
%.sroa.speculated.i.i = call i64 @llvm.umin.i64(i64 %agg.tmp.i.sroa.8.0.copyload19, i64 %add6.i.i)
%16 = getelementptr inbounds i8, ptr addrspace(4) %agg.tmp.i.sroa.11.0.copyload25, i64 24
br label %for.cond.i.i
for.cond.i.i: ; preds = %for.body.i.i, %if.end.i.i
%ind.0.i.i = phi i64 [ %add4.i.i, %if.end.i.i ], [ %inc.i.i, %for.body.i.i ]
%cmp8.i.i = icmp ult i64 %ind.0.i.i, %.sroa.speculated.i.i
br i1 %cmp8.i.i, label %for.body.i.i, label %lexit1
for.body.i.i: ; preds = %for.cond.i.i
%17 = load ptr addrspace(1), ptr addrspace(4) %16, align 8
%arrayidx.i.i.i = getelementptr inbounds i32, ptr addrspace(1) %17, i64 %ind.0.i.i
%18 = load i32, ptr addrspace(1) %arrayidx.i.i.i, align 4
%add10.i.i = add nsw i32 %18, %agg.tmp.i.sroa.9.0.copyload21
store i32 %add10.i.i, ptr addrspace(1) %arrayidx.i.i.i, align 4
%inc.i.i = add nuw i64 %ind.0.i.i, 1
br label %for.cond.i.i
lexit1: ; preds = %for.cond.i.i, %LeaderMat.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz15.i, label %wg_leader10.i, label %wg_cf11.i
wg_leader10.i: ; preds = %lexit1
%19 = load i32, ptr addrspace(3) @GCnt, align 4
%inc.i = add nsw i32 %19, 1
store i32 %inc.i, ptr addrspace(3) @GCnt, align 4
br label %wg_cf11.i
wg_cf11.i: ; preds = %wg_leader10.i, %lexit1
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br label %for.cond.i
_ZNK11PFWGFunctorclEN4sycl3_V15groupILi1EEE.exit: ; preds = %wg_cf5.i
call void @llvm.lifetime.end.p0(i64 32, ptr nonnull %agg.tmp67)
ret void
}
; Function Attrs: nocallback nofree nosync nounwind willreturn memory(argmem: readwrite)
declare void @llvm.lifetime.start.p0(i64 immarg, ptr nocapture)
; Function Attrs: convergent nounwind
declare dso_local spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef, i32 noundef, i32 noundef)
; Function Attrs: nocallback nofree nounwind willreturn memory(argmem: readwrite)
declare void @llvm.memcpy.p3.p0.i64(ptr addrspace(3) noalias nocapture writeonly, ptr noalias nocapture readonly, i64, i1 immarg)
; Function Attrs: nocallback nofree nounwind willreturn memory(argmem: readwrite)
declare void @llvm.memcpy.p0.p3.i64(ptr noalias nocapture writeonly, ptr addrspace(3) noalias nocapture readonly, i64, i1 immarg)
; Function Attrs: nocallback nofree nosync nounwind speculatable willreturn memory(none)
declare i64 @llvm.umin.i64(i64, i64)
; Function Attrs: nocallback nofree nosync nounwind willreturn memory(argmem: readwrite)
declare void @llvm.lifetime.end.p0(i64 immarg, ptr nocapture)
; Function Attrs: convergent mustprogress norecurse nounwind
define weak_odr dso_local spir_kernel void @bar(ptr addrspace(1) noundef align 4 %_arg_dev_ptr, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr1, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr2, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr3) {
entry:
%agg.tmp67 = alloca %"class.sycl::_V1::group", align 8
%0 = load i64, ptr %_arg_dev_ptr1, align 8
%1 = load i64, ptr %_arg_dev_ptr2, align 8
%2 = load i64, ptr %_arg_dev_ptr3, align 8
store i64 %2, ptr addrspace(3) @GKernel1, align 8
store i64 %0, ptr addrspace(3) undef, align 8
store i64 %1, ptr addrspace(3) undef, align 8
%add.ptr.i = getelementptr inbounds i32, ptr addrspace(1) %_arg_dev_ptr, i64 %2
store ptr addrspace(1) %add.ptr.i, ptr addrspace(3) undef, align 8
%3 = load i64, ptr addrspace(1) @__spirv_BuiltInGlobalSize, align 32
%4 = load i64, ptr addrspace(1) @__spirv_BuiltInWorkgroupSize, align 32
%5 = load i64, ptr addrspace(1) @__spirv_BuiltInNumWorkgroups, align 32
%6 = load i64, ptr addrspace(1) @__spirv_BuiltInWorkgroupId, align 32
call void @llvm.lifetime.start.p0(i64 32, ptr nonnull %agg.tmp67)
store i64 %3, ptr %agg.tmp67, align 1
%agg.tmp6.sroa.2.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 8
store i64 %4, ptr %agg.tmp6.sroa.2.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.3.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 16
store i64 %5, ptr %agg.tmp6.sroa.3.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.4.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 24
store i64 %6, ptr %agg.tmp6.sroa.4.0.agg.tmp67.sroa_idx, align 1
%7 = load i64, ptr addrspace(1) @__spirv_BuiltInLocalInvocationIndex, align 8
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%cmpz27.i = icmp eq i64 %7, 0
br i1 %cmpz27.i, label %leader.i, label %merge.i
leader.i: ; preds = %entry
call void @llvm.memcpy.p3.p0.i64(ptr addrspace(3) noundef align 16 dereferenceable(32) @ArgShadow.7, ptr noundef nonnull align 8 dereferenceable(32) %agg.tmp67, i64 32, i1 false)
br label %merge.i
merge.i: ; preds = %leader.i, %entry
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call void @llvm.memcpy.p0.p3.i64(ptr noundef nonnull align 8 dereferenceable(32) %agg.tmp67, ptr addrspace(3) noundef align 16 dereferenceable(32) @ArgShadow.7, i64 32, i1 false)
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz27.i, label %wg_leader.i, label %wg_cf.i
wg_leader.i: ; preds = %merge.i
%g.ascast.i = addrspacecast ptr %agg.tmp67 to ptr addrspace(4)
store ptr addrspace(4) %g.ascast.i, ptr addrspace(3) @GAsCast2, align 8
store i32 0, ptr addrspace(3) @GCnt2, align 4
br label %wg_cf.i
wg_cf.i: ; preds = %wg_leader.i, %merge.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%8 = load i64, ptr addrspace(1) @__spirv_BuiltInGlobalInvocationId, align 32
%9 = load i64, ptr addrspace(1) @__spirv_BuiltInLocalInvocationId, align 32
%cmp.i.i.i.i.i.i = icmp ult i64 %8, 2147483648
br label %for.cond.i
for.cond.i: ; preds = %wg_cf18.i, %wg_cf.i
%agg.tmp5.i.sroa.0.0 = phi i64 [ undef, %wg_cf.i ], [ %18, %wg_cf18.i ]
%agg.tmp4.i.sroa.0.0 = phi i64 [ undef, %wg_cf.i ], [ %17, %wg_cf18.i ]
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz27.i, label %wg_leader8.i, label %wg_cf9.i
wg_leader8.i: ; preds = %for.cond.i
%10 = load i32, ptr addrspace(3) @GCnt2, align 4
%cmp.i = icmp slt i32 %10, 2
store i1 %cmp.i, ptr addrspace(3) @GCmp2, align 1
br label %wg_cf9.i
wg_cf9.i: ; preds = %wg_leader8.i, %for.cond.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%wg_val_cmp.i = load i1, ptr addrspace(3) @GCmp2, align 1
br i1 %wg_val_cmp.i, label %for.body.i, label %lexit2
for.body.i: ; preds = %wg_cf9.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz27.i, label %TestMat25.i, label %LeaderMat22.i
TestMat25.i: ; preds = %for.body.i
store i64 %agg.tmp5.i.sroa.0.0, ptr addrspace(3) @WGCopy.6.0, align 8
store i64 ptrtoint (ptr addrspace(4) addrspacecast (ptr addrspace(3) @GKernel1 to ptr addrspace(4)) to i64), ptr addrspace(3) @WGCopy.4.0, align 8
store i64 5, ptr addrspace(3) @WGCopy.3.0, align 8
store i64 %agg.tmp4.i.sroa.0.0, ptr addrspace(3) @WGCopy.5.0, align 8
br label %LeaderMat22.i
LeaderMat22.i: ; preds = %TestMat25.i, %for.body.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%11 = load i64, ptr addrspace(3) @WGCopy.3.0, align 8
%12 = load i64, ptr addrspace(3) @WGCopy.4.0, align 8
%13 = inttoptr i64 %12 to ptr addrspace(4)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
%14 = getelementptr inbounds i8, ptr addrspace(4) %13, i64 24
br label %for.cond.i.i
for.cond.i.i: ; preds = %for.body.i.i, %LeaderMat22.i
%storemerge.i.i = phi i64 [ %9, %LeaderMat22.i ], [ %add.i.i, %for.body.i.i ]
%cmp.i.i = icmp ult i64 %storemerge.i.i, %11
br i1 %cmp.i.i, label %for.body.i.i, label %lexit3
for.body.i.i: ; preds = %for.cond.i.i
call void @llvm.assume(i1 %cmp.i.i.i.i.i.i)
%15 = load ptr addrspace(1), ptr addrspace(4) %14, align 8
%arrayidx.i.i.i.i.i = getelementptr inbounds i32, ptr addrspace(1) %15, i64 %8
%16 = load i32, ptr addrspace(1) %arrayidx.i.i.i.i.i, align 4
%inc.i.i.i.i = add nsw i32 %16, 1
store i32 %inc.i.i.i.i, ptr addrspace(1) %arrayidx.i.i.i.i.i, align 4
%add.i.i = add i64 %storemerge.i.i, %4
br label %for.cond.i.i
lexit3: ; preds = %for.cond.i.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz27.i, label %TestMat.i, label %LeaderMat.i
TestMat.i: ; preds = %lexit3
store i64 ptrtoint (ptr addrspace(4) addrspacecast (ptr addrspace(3) @GKernel1 to ptr addrspace(4)) to i64), ptr addrspace(3) @WGCopy.6.0, align 8
store i64 %12, ptr addrspace(3) @WGCopy.4.0, align 8
store i64 %11, ptr addrspace(3) @WGCopy.3.0, align 8
store i64 2, ptr addrspace(3) @WGCopy.5.0, align 8
br label %LeaderMat.i
LeaderMat.i: ; preds = %TestMat.i, %lexit3
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%17 = load i64, ptr addrspace(3) @WGCopy.5.0, align 8
%18 = load i64, ptr addrspace(3) @WGCopy.6.0, align 8
%19 = inttoptr i64 %18 to ptr addrspace(4)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
%20 = getelementptr inbounds i8, ptr addrspace(4) %19, i64 24
br label %for.cond.i.i19
for.cond.i.i19: ; preds = %for.body.i.i22, %LeaderMat.i
%storemerge.i.i20 = phi i64 [ %9, %LeaderMat.i ], [ %add.i.i26, %for.body.i.i22 ]
%cmp.i.i21 = icmp ult i64 %storemerge.i.i20, %17
br i1 %cmp.i.i21, label %for.body.i.i22, label %lexit4
for.body.i.i22: ; preds = %for.cond.i.i19
call void @llvm.assume(i1 %cmp.i.i.i.i.i.i)
%21 = load ptr addrspace(1), ptr addrspace(4) %20, align 8
%arrayidx.i.i.i.i.i23 = getelementptr inbounds i32, ptr addrspace(1) %21, i64 %8
%22 = load i32, ptr addrspace(1) %arrayidx.i.i.i.i.i23, align 4
%inc.i.i.i.i25 = add nsw i32 %22, 1
store i32 %inc.i.i.i.i25, ptr addrspace(1) %arrayidx.i.i.i.i.i23, align 4
%add.i.i26 = add i64 %storemerge.i.i20, %4
br label %for.cond.i.i19
lexit4: ; preds = %for.cond.i.i19
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz27.i, label %wg_leader17.i, label %wg_cf18.i
wg_leader17.i: ; preds = %lexit4
%23 = load i32, ptr addrspace(3) @GCnt2, align 4
%inc.i = add nsw i32 %23, 1
store i32 %inc.i, ptr addrspace(3) @GCnt2, align 4
br label %wg_cf18.i
wg_cf18.i: ; preds = %wg_leader17.i, %lexit4
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br label %for.cond.i
lexit2: ; preds = %wg_cf9.i
call void @llvm.lifetime.end.p0(i64 32, ptr nonnull %agg.tmp67)
ret void
}
; Function Attrs: nocallback nofree nosync nounwind willreturn memory(inaccessiblemem: write)
declare void @llvm.assume(i1 noundef)
; Function Attrs: convergent mustprogress norecurse nounwind
define weak_odr dso_local spir_kernel void @test1(ptr addrspace(1) noundef align 4 %_arg_dev_ptr, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr1, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr2, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr3) {
entry:
%agg.tmp67 = alloca %"class.sycl::_V1::group", align 8
%0 = load i64, ptr %_arg_dev_ptr1, align 8
%1 = load i64, ptr %_arg_dev_ptr2, align 8
%2 = load i64, ptr %_arg_dev_ptr3, align 8
store i64 %2, ptr addrspace(3) @GKernel2, align 8
store i64 %0, ptr addrspace(3) undef, align 8
store i64 %1, ptr addrspace(3) undef, align 8
%add.ptr.i = getelementptr inbounds i32, ptr addrspace(1) %_arg_dev_ptr, i64 %2
store ptr addrspace(1) %add.ptr.i, ptr addrspace(3) undef, align 8
%3 = load i64, ptr addrspace(1) @__spirv_BuiltInGlobalSize, align 32
%4 = load i64, ptr addrspace(1) @__spirv_BuiltInWorkgroupSize, align 32
%5 = load i64, ptr addrspace(1) @__spirv_BuiltInNumWorkgroups, align 32
%6 = load i64, ptr addrspace(1) @__spirv_BuiltInWorkgroupId, align 32
call void @llvm.lifetime.start.p0(i64 32, ptr nonnull %agg.tmp67)
store i64 %3, ptr %agg.tmp67, align 1
%agg.tmp6.sroa.2.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 8
store i64 %4, ptr %agg.tmp6.sroa.2.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.3.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 16
store i64 %5, ptr %agg.tmp6.sroa.3.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.4.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 24
store i64 %6, ptr %agg.tmp6.sroa.4.0.agg.tmp67.sroa_idx, align 1
%7 = load i64, ptr addrspace(1) @__spirv_BuiltInLocalInvocationIndex, align 8
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%cmpz15.i = icmp eq i64 %7, 0
br i1 %cmpz15.i, label %leader.i, label %merge.i
leader.i: ; preds = %entry
call void @llvm.memcpy.p3.p0.i64(ptr addrspace(3) noundef align 16 dereferenceable(32) @ArgShadow.11, ptr noundef nonnull align 8 dereferenceable(32) %agg.tmp67, i64 32, i1 false)
br label %merge.i
merge.i: ; preds = %leader.i, %entry
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call void @llvm.memcpy.p0.p3.i64(ptr noundef nonnull align 8 dereferenceable(32) %agg.tmp67, ptr addrspace(3) noundef align 16 dereferenceable(32) @ArgShadow.11, i64 32, i1 false)
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz15.i, label %wg_leader.i, label %wg_cf.i
wg_leader.i: ; preds = %merge.i
%g.ascast.i = addrspacecast ptr %agg.tmp67 to ptr addrspace(4)
store ptr addrspace(4) %g.ascast.i, ptr addrspace(3) @GAscast3, align 8
store i32 0, ptr addrspace(3) @GCnt3, align 4
br label %wg_cf.i
wg_cf.i: ; preds = %wg_leader.i, %merge.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%8 = load i64, ptr addrspace(1) @__spirv_BuiltInGlobalInvocationId, align 32
%9 = load i64, ptr addrspace(1) @__spirv_BuiltInLocalInvocationId, align 32
%cmp.i.i.i.i.i.i = icmp ult i64 %8, 2147483648
br label %for.cond.i
for.cond.i: ; preds = %wg_cf11.i, %wg_cf.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz15.i, label %wg_leader4.i, label %wg_cf5.i
wg_leader4.i: ; preds = %for.cond.i
%10 = load i32, ptr addrspace(3) @GCnt3, align 4
%cmp.i = icmp slt i32 %10, 2
store i1 %cmp.i, ptr addrspace(3) @GCmp3, align 1
br label %wg_cf5.i
wg_cf5.i: ; preds = %wg_leader4.i, %for.cond.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%wg_val_cmp.i = load i1, ptr addrspace(3) @GCmp3, align 1
br i1 %wg_val_cmp.i, label %for.body.i, label %lexit6
for.body.i: ; preds = %wg_cf5.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz15.i, label %TestMat.i, label %LeaderMat.i
TestMat.i: ; preds = %for.body.i
store i64 ptrtoint (ptr addrspace(4) addrspacecast (ptr addrspace(3) @GKernel2 to ptr addrspace(4)) to i64), ptr addrspace(3) @WGCopy.10.0, align 8
store i64 5, ptr addrspace(3) @WGCopy.9.0, align 8
br label %LeaderMat.i
LeaderMat.i: ; preds = %TestMat.i, %for.body.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%11 = load i64, ptr addrspace(3) @WGCopy.9.0, align 8
%12 = load i64, ptr addrspace(3) @WGCopy.10.0, align 8
%13 = inttoptr i64 %12 to ptr addrspace(4)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
%14 = getelementptr inbounds i8, ptr addrspace(4) %13, i64 24
br label %for.cond.i.i
for.cond.i.i: ; preds = %for.body.i.i, %LeaderMat.i
%storemerge.i.i = phi i64 [ %9, %LeaderMat.i ], [ %add.i.i, %for.body.i.i ]
%cmp.i.i = icmp ult i64 %storemerge.i.i, %11
br i1 %cmp.i.i, label %for.body.i.i, label %lexit7
for.body.i.i: ; preds = %for.cond.i.i
%cmp5.not.i.i.i.i.i.i = icmp ne i64 %storemerge.i.i, %9
%cond.i.i.i.i = zext i1 %cmp5.not.i.i.i.i.i.i to i32
call void @llvm.assume(i1 %cmp.i.i.i.i.i.i)
%15 = load ptr addrspace(1), ptr addrspace(4) %14, align 8
%arrayidx.i.i.i.i.i = getelementptr inbounds i32, ptr addrspace(1) %15, i64 %8
%16 = load i32, ptr addrspace(1) %arrayidx.i.i.i.i.i, align 4
%add.i.i.i.i = add nsw i32 %16, %cond.i.i.i.i
store i32 %add.i.i.i.i, ptr addrspace(1) %arrayidx.i.i.i.i.i, align 4
%add.i.i = add i64 %storemerge.i.i, %4
br label %for.cond.i.i
lexit7: ; preds = %for.cond.i.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz15.i, label %wg_leader10.i, label %wg_cf11.i
wg_leader10.i: ; preds = %lexit7
%17 = load i32, ptr addrspace(3) @GCnt3, align 4
%inc.i = add nsw i32 %17, 1
store i32 %inc.i, ptr addrspace(3) @GCnt3, align 4
br label %wg_cf11.i
wg_cf11.i: ; preds = %wg_leader10.i, %lexit7
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br label %for.cond.i
lexit6: ; preds = %wg_cf5.i
call void @llvm.lifetime.end.p0(i64 32, ptr nonnull %agg.tmp67)
ret void
}
; Function Attrs: convergent mustprogress norecurse nounwind
define weak_odr dso_local spir_kernel void @test2(ptr addrspace(1) noundef align 4 %_arg_dev_ptr, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr1, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr2, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr3) {
entry:
%priv.i = alloca %"class.sycl::_V1::private_memory", align 4
%agg.tmp67 = alloca %"class.sycl::_V1::group.15", align 8
%0 = load i64, ptr %_arg_dev_ptr1, align 8
%1 = load i64, ptr %_arg_dev_ptr2, align 8
%2 = load i64, ptr %_arg_dev_ptr3, align 8
store i64 %2, ptr addrspace(3) @GKernel3, align 8
store i64 %0, ptr addrspace(3) undef, align 8
store i64 %1, ptr addrspace(3) undef, align 8
%add.ptr.i = getelementptr inbounds i32, ptr addrspace(1) %_arg_dev_ptr, i64 %2
store ptr addrspace(1) %add.ptr.i, ptr addrspace(3) undef, align 8
%3 = load i64, ptr addrspace(1) undef, align 8
%4 = load i64, ptr addrspace(1) @__spirv_BuiltInGlobalSize, align 32
%5 = load i64, ptr addrspace(1) undef, align 8
%6 = load i64, ptr addrspace(1) @__spirv_BuiltInWorkgroupSize, align 32
%7 = load i64, ptr addrspace(1) undef, align 8
%8 = load i64, ptr addrspace(1) @__spirv_BuiltInNumWorkgroups, align 32
%9 = load i64, ptr addrspace(1) undef, align 8
%10 = load i64, ptr addrspace(1) @__spirv_BuiltInWorkgroupId, align 32
call void @llvm.lifetime.start.p0(i64 64, ptr nonnull %agg.tmp67)
store i64 %3, ptr %agg.tmp67, align 1
%agg.tmp6.sroa.2.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 8
store i64 %4, ptr %agg.tmp6.sroa.2.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.3.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 16
store i64 %5, ptr %agg.tmp6.sroa.3.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.4.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 24
store i64 %6, ptr %agg.tmp6.sroa.4.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.5.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 32
store i64 %7, ptr %agg.tmp6.sroa.5.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.6.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 40
store i64 %8, ptr %agg.tmp6.sroa.6.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.7.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 48
store i64 %9, ptr %agg.tmp6.sroa.7.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.8.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 56
store i64 %10, ptr %agg.tmp6.sroa.8.0.agg.tmp67.sroa_idx, align 1
%11 = load i64, ptr addrspace(1) @__spirv_BuiltInLocalInvocationIndex, align 8
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%cmpz32.i = icmp eq i64 %11, 0
br i1 %cmpz32.i, label %leader.i, label %merge.i
leader.i: ; preds = %entry
call void @llvm.memcpy.p3.p0.i64(ptr addrspace(3) noundef align 16 dereferenceable(64) @ArgShadow.17, ptr noundef nonnull align 8 dereferenceable(64) %agg.tmp67, i64 64, i1 false)
br label %merge.i
merge.i: ; preds = %leader.i, %entry
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call void @llvm.memcpy.p0.p3.i64(ptr noundef nonnull align 8 dereferenceable(64) %agg.tmp67, ptr addrspace(3) noundef align 16 dereferenceable(64) @ArgShadow.17, i64 64, i1 false)
%priv.ascast.i = addrspacecast ptr %priv.i to ptr addrspace(4)
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz32.i, label %wg_leader.i, label %wg_cf.i
wg_leader.i: ; preds = %merge.i
%g.ascast.i = addrspacecast ptr %agg.tmp67 to ptr addrspace(4)
store ptr addrspace(4) %g.ascast.i, ptr addrspace(3) @GAsCast4, align 8
call void @llvm.lifetime.start.p0(i64 8, ptr nonnull %priv.i)
store i32 0, ptr addrspace(3) @GCnt4, align 4
br label %wg_cf.i
wg_cf.i: ; preds = %wg_leader.i, %merge.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%12 = load i64, ptr addrspace(1) undef, align 8
%13 = load i64, ptr addrspace(1) @__spirv_BuiltInGlobalInvocationId, align 32
%14 = load i64, ptr addrspace(1) undef, align 8
%15 = load i64, ptr addrspace(1) @__spirv_BuiltInLocalInvocationId, align 32
%mul.i.i.i.i.i.i = mul i64 %12, %4
%add.i.i.i.i.i.i = add i64 %mul.i.i.i.i.i.i, %13
%cmp.i.i.i.i.i.i = icmp ult i64 %add.i.i.i.i.i.i, 2147483648
%conv.i.i.i.i.i = trunc i64 %add.i.i.i.i.i.i to i32
%y.i.i.i.i.i = getelementptr inbounds i8, ptr %priv.i, i64 4
br label %for.cond.i
for.cond.i: ; preds = %wg_cf20.i, %wg_cf.i
%agg.tmp6.i.sroa.9.0 = phi ptr addrspace(4) [ undef, %wg_cf.i ], [ %agg.tmp6.i.sroa.9.0.copyload40, %wg_cf20.i ]
%agg.tmp5.i.sroa.0.0 = phi i64 [ undef, %wg_cf.i ], [ %agg.tmp5.i.sroa.0.0.copyload44, %wg_cf20.i ]
%agg.tmp5.i.sroa.8.0 = phi i64 [ undef, %wg_cf.i ], [ %agg.tmp5.i.sroa.8.0.copyload48, %wg_cf20.i ]
%agg.tmp2.i.sroa.0.0 = phi ptr addrspace(4) [ undef, %wg_cf.i ], [ %agg.tmp2.i.sroa.0.0.copyload52, %wg_cf20.i ]
%agg.tmp2.i.sroa.8.0 = phi ptr addrspace(4) [ undef, %wg_cf.i ], [ %agg.tmp2.i.sroa.8.0.copyload56, %wg_cf20.i ]
%agg.tmp.i.sroa.0.0 = phi i64 [ undef, %wg_cf.i ], [ %agg.tmp.i.sroa.0.0.copyload60, %wg_cf20.i ]
%agg.tmp.i.sroa.8.0 = phi i64 [ undef, %wg_cf.i ], [ %agg.tmp.i.sroa.8.0.copyload64, %wg_cf20.i ]
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz32.i, label %wg_leader10.i, label %wg_cf11.i
wg_leader10.i: ; preds = %for.cond.i
%16 = load i32, ptr addrspace(3) @GCnt4, align 4
%cmp.i = icmp slt i32 %16, 2
store i1 %cmp.i, ptr addrspace(3) @GCmp4, align 1
br label %wg_cf11.i
wg_cf11.i: ; preds = %wg_leader10.i, %for.cond.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%wg_val_cmp.i = load i1, ptr addrspace(3) @GCmp4, align 1
br i1 %wg_val_cmp.i, label %for.body.i, label %for.end.i
for.body.i: ; preds = %wg_cf11.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz32.i, label %wg_leader13.i, label %wg_cf14.i
wg_leader13.i: ; preds = %for.body.i
br label %wg_cf14.i
wg_cf14.i: ; preds = %wg_leader13.i, %for.body.i
%agg.tmp2.i.sroa.0.1 = phi ptr addrspace(4) [ addrspacecast (ptr addrspace(3) @GKernel3 to ptr addrspace(4)), %wg_leader13.i ], [ %agg.tmp2.i.sroa.0.0, %for.body.i ]
%agg.tmp2.i.sroa.8.1 = phi ptr addrspace(4) [ %priv.ascast.i, %wg_leader13.i ], [ %agg.tmp2.i.sroa.8.0, %for.body.i ]
%agg.tmp.i.sroa.0.1 = phi i64 [ 7, %wg_leader13.i ], [ %agg.tmp.i.sroa.0.0, %for.body.i ]
%agg.tmp.i.sroa.8.1 = phi i64 [ 3, %wg_leader13.i ], [ %agg.tmp.i.sroa.8.0, %for.body.i ]
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz32.i, label %TestMat30.i, label %LeaderMat27.i
TestMat30.i: ; preds = %wg_cf14.i
store i64 %agg.tmp.i.sroa.0.1, ptr addrspace(3) @WGCopy.13.0, align 8
store i64 %agg.tmp.i.sroa.8.1, ptr addrspace(3) @WGCopy.13.1, align 8
store ptr addrspace(4) %agg.tmp2.i.sroa.0.1, ptr addrspace(3) @WGCopy.14.0, align 8
store ptr addrspace(4) %agg.tmp2.i.sroa.8.1, ptr addrspace(3) @WGCopy.14.1, align 8
store i64 %agg.tmp5.i.sroa.0.0, ptr addrspace(3) @WGCopy.15.0, align 8
store i64 %agg.tmp5.i.sroa.8.0, ptr addrspace(3) @WGCopy.15.1, align 8
store ptr addrspace(4) %priv.ascast.i, ptr addrspace(3) @WGCopy.16.0, align 8
store ptr addrspace(4) %agg.tmp6.i.sroa.9.0, ptr addrspace(3) @WGCopy.16.1, align 8
br label %LeaderMat27.i
LeaderMat27.i: ; preds = %TestMat30.i, %wg_cf14.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%agg.tmp6.i.sroa.0.0.copyload = load ptr addrspace(4), ptr addrspace(3) @WGCopy.16.0, align 8
%agg.tmp6.i.sroa.9.0.copyload = load ptr addrspace(4), ptr addrspace(3) @WGCopy.16.1, align 8
%agg.tmp5.i.sroa.0.0.copyload = load i64, ptr addrspace(3) @WGCopy.15.0, align 8
%agg.tmp5.i.sroa.8.0.copyload = load i64, ptr addrspace(3) @WGCopy.15.1, align 8
%agg.tmp2.i.sroa.0.0.copyload = load ptr addrspace(4), ptr addrspace(3) @WGCopy.14.0, align 8
%agg.tmp.i.sroa.0.0.copyload = load i64, ptr addrspace(3) @WGCopy.13.0, align 8
%agg.tmp.i.sroa.8.0.copyload = load i64, ptr addrspace(3) @WGCopy.13.1, align 8
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
%17 = getelementptr inbounds i8, ptr addrspace(4) %agg.tmp2.i.sroa.0.0.copyload, i64 24
br label %for.cond.i.i
for.cond.i.i: ; preds = %lexit10, %LeaderMat27.i
%storemerge.i.i = phi i64 [ %14, %LeaderMat27.i ], [ %add.i.i, %lexit10 ]
%cmp.i.i = icmp ult i64 %storemerge.i.i, %agg.tmp.i.sroa.0.0.copyload
br i1 %cmp.i.i, label %for.cond.i.i.i, label %lexit11
for.cond.i.i.i: ; preds = %for.body.i.i.i, %for.cond.i.i
%storemerge.i.i.i = phi i64 [ %add.i.i.i, %for.body.i.i.i ], [ %15, %for.cond.i.i ]
%cmp.i.i.i = icmp ult i64 %storemerge.i.i.i, %agg.tmp.i.sroa.8.0.copyload
br i1 %cmp.i.i.i, label %for.body.i.i.i, label %lexit10
for.body.i.i.i: ; preds = %for.cond.i.i.i
call void @llvm.assume(i1 %cmp.i.i.i.i.i.i)
%18 = load ptr addrspace(1), ptr addrspace(4) %17, align 8
%arrayidx.i.i.i.i.i.i = getelementptr inbounds i32, ptr addrspace(1) %18, i64 %add.i.i.i.i.i.i
%19 = load i32, ptr addrspace(1) %arrayidx.i.i.i.i.i.i, align 4
%inc.i.i.i.i.i = add nsw i32 %19, 1
store i32 %inc.i.i.i.i.i, ptr addrspace(1) %arrayidx.i.i.i.i.i.i, align 4
store i32 %conv.i.i.i.i.i, ptr %priv.i, align 4
store i32 5, ptr %y.i.i.i.i.i, align 4
%add.i.i.i = add i64 %storemerge.i.i.i, %6
br label %for.cond.i.i.i
lexit10: ; preds = %for.cond.i.i.i
%add.i.i = add i64 %storemerge.i.i, %5
br label %for.cond.i.i
lexit11: ; preds = %for.cond.i.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz32.i, label %wg_leader16.i, label %wg_cf17.i
wg_leader16.i: ; preds = %lexit11
br label %wg_cf17.i
wg_cf17.i: ; preds = %wg_leader16.i, %lexit11
%agg.tmp6.i.sroa.0.1 = phi ptr addrspace(4) [ %priv.ascast.i, %wg_leader16.i ], [ %agg.tmp6.i.sroa.0.0.copyload, %lexit11 ]
%agg.tmp6.i.sroa.9.1 = phi ptr addrspace(4) [ addrspacecast (ptr addrspace(3) @GKernel3 to ptr addrspace(4)), %wg_leader16.i ], [ %agg.tmp6.i.sroa.9.0.copyload, %lexit11 ]
%agg.tmp5.i.sroa.0.1 = phi i64 [ 7, %wg_leader16.i ], [ %agg.tmp5.i.sroa.0.0.copyload, %lexit11 ]
%agg.tmp5.i.sroa.8.1 = phi i64 [ 3, %wg_leader16.i ], [ %agg.tmp5.i.sroa.8.0.copyload, %lexit11 ]
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz32.i, label %TestMat.i, label %LeaderMat.i
TestMat.i: ; preds = %wg_cf17.i
store i64 %agg.tmp.i.sroa.0.0.copyload, ptr addrspace(3) @WGCopy.13.0, align 8
store i64 %agg.tmp.i.sroa.8.0.copyload, ptr addrspace(3) @WGCopy.13.1, align 8
store ptr addrspace(4) %agg.tmp2.i.sroa.0.0.copyload, ptr addrspace(3) @WGCopy.14.0, align 8
store ptr addrspace(4) %priv.ascast.i, ptr addrspace(3) @WGCopy.14.1, align 8
store i64 %agg.tmp5.i.sroa.0.1, ptr addrspace(3) @WGCopy.15.0, align 8
store i64 %agg.tmp5.i.sroa.8.1, ptr addrspace(3) @WGCopy.15.1, align 8
store ptr addrspace(4) %agg.tmp6.i.sroa.0.1, ptr addrspace(3) @WGCopy.16.0, align 8
store ptr addrspace(4) %agg.tmp6.i.sroa.9.1, ptr addrspace(3) @WGCopy.16.1, align 8
br label %LeaderMat.i
LeaderMat.i: ; preds = %TestMat.i, %wg_cf17.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%agg.tmp6.i.sroa.9.0.copyload40 = load ptr addrspace(4), ptr addrspace(3) @WGCopy.16.1, align 8
%agg.tmp5.i.sroa.0.0.copyload44 = load i64, ptr addrspace(3) @WGCopy.15.0, align 8
%agg.tmp5.i.sroa.8.0.copyload48 = load i64, ptr addrspace(3) @WGCopy.15.1, align 8
%agg.tmp2.i.sroa.0.0.copyload52 = load ptr addrspace(4), ptr addrspace(3) @WGCopy.14.0, align 8
%agg.tmp2.i.sroa.8.0.copyload56 = load ptr addrspace(4), ptr addrspace(3) @WGCopy.14.1, align 8
%agg.tmp.i.sroa.0.0.copyload60 = load i64, ptr addrspace(3) @WGCopy.13.0, align 8
%agg.tmp.i.sroa.8.0.copyload64 = load i64, ptr addrspace(3) @WGCopy.13.1, align 8
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
%20 = getelementptr inbounds i8, ptr addrspace(4) %agg.tmp6.i.sroa.9.0.copyload40, i64 24
br label %for.cond.i.i25
for.cond.i.i25: ; preds = %lexit12, %LeaderMat.i
%storemerge.i.i26 = phi i64 [ %14, %LeaderMat.i ], [ %add.i.i31, %lexit12 ]
%cmp.i.i27 = icmp ult i64 %storemerge.i.i26, %agg.tmp5.i.sroa.0.0.copyload44
br i1 %cmp.i.i27, label %for.cond.i.i.i28, label %lexit13
for.cond.i.i.i28: ; preds = %for.body.i.i.i32, %for.cond.i.i25
%storemerge.i.i.i29 = phi i64 [ %add.i.i.i35, %for.body.i.i.i32 ], [ %15, %for.cond.i.i25 ]
%cmp.i.i.i30 = icmp ult i64 %storemerge.i.i.i29, %agg.tmp5.i.sroa.8.0.copyload48
br i1 %cmp.i.i.i30, label %for.body.i.i.i32, label %lexit12
for.body.i.i.i32: ; preds = %for.cond.i.i.i28
%21 = load i32, ptr %priv.i, align 4
%22 = load i32, ptr %y.i.i.i.i.i, align 4
%add.i.i.i.i.i = add nsw i32 %21, %22
call void @llvm.assume(i1 %cmp.i.i.i.i.i.i)
%23 = load ptr addrspace(1), ptr addrspace(4) %20, align 8
%arrayidx.i.i.i.i.i.i33 = getelementptr inbounds i32, ptr addrspace(1) %23, i64 %add.i.i.i.i.i.i
%24 = load i32, ptr addrspace(1) %arrayidx.i.i.i.i.i.i33, align 4
%add4.i.i.i.i.i = add nsw i32 %24, %add.i.i.i.i.i
store i32 %add4.i.i.i.i.i, ptr addrspace(1) %arrayidx.i.i.i.i.i.i33, align 4
%add.i.i.i35 = add i64 %storemerge.i.i.i29, %6
br label %for.cond.i.i.i28
lexit12: ; preds = %for.cond.i.i.i28
%add.i.i31 = add i64 %storemerge.i.i26, %5
br label %for.cond.i.i25
lexit13: ; preds = %for.cond.i.i25
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz32.i, label %wg_leader19.i, label %wg_cf20.i
wg_leader19.i: ; preds = %lexit13
%25 = load i32, ptr addrspace(3) @GCnt4, align 4
%inc.i = add nsw i32 %25, 1
store i32 %inc.i, ptr addrspace(3) @GCnt4, align 4
br label %wg_cf20.i
wg_cf20.i: ; preds = %wg_leader19.i, %lexit13
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br label %for.cond.i
for.end.i: ; preds = %wg_cf11.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz32.i, label %wg_leader22.i, label %lexit14
wg_leader22.i: ; preds = %for.end.i
call void @llvm.lifetime.end.p0(i64 8, ptr nonnull %priv.i)
br label %lexit14
lexit14: ; preds = %wg_leader22.i, %for.end.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call void @llvm.lifetime.end.p0(i64 64, ptr nonnull %agg.tmp67)
ret void
}
; Function Attrs: convergent mustprogress norecurse nounwind
define weak_odr dso_local spir_kernel void @test3(ptr addrspace(1) noundef align 4 %_arg_dev_ptr, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr1, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr2, ptr noundef byval(%"class.sycl::_V1::range") align 8 %_arg_dev_ptr3) {
entry:
%agg.tmp67 = alloca %"class.sycl::_V1::group", align 8
%0 = load i64, ptr %_arg_dev_ptr1, align 8
%1 = load i64, ptr %_arg_dev_ptr2, align 8
%2 = load i64, ptr %_arg_dev_ptr3, align 8
store i64 %2, ptr addrspace(3) @GKernel4, align 8
store i64 %0, ptr addrspace(3) undef, align 8
store i64 %1, ptr addrspace(3) undef, align 8
%add.ptr.i = getelementptr inbounds i32, ptr addrspace(1) %_arg_dev_ptr, i64 %2
store ptr addrspace(1) %add.ptr.i, ptr addrspace(3) undef, align 8
%3 = load i64, ptr addrspace(1) @__spirv_BuiltInGlobalSize, align 32
%4 = load i64, ptr addrspace(1) @__spirv_BuiltInWorkgroupSize, align 32
%5 = load i64, ptr addrspace(1) @__spirv_BuiltInNumWorkgroups, align 32
%6 = load i64, ptr addrspace(1) @__spirv_BuiltInWorkgroupId, align 32
call void @llvm.lifetime.start.p0(i64 32, ptr nonnull %agg.tmp67)
store i64 %3, ptr %agg.tmp67, align 1
%agg.tmp6.sroa.2.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 8
store i64 %4, ptr %agg.tmp6.sroa.2.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.3.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 16
store i64 %5, ptr %agg.tmp6.sroa.3.0.agg.tmp67.sroa_idx, align 1
%agg.tmp6.sroa.4.0.agg.tmp67.sroa_idx = getelementptr inbounds i8, ptr %agg.tmp67, i64 24
store i64 %6, ptr %agg.tmp6.sroa.4.0.agg.tmp67.sroa_idx, align 1
%7 = load i64, ptr addrspace(1) @__spirv_BuiltInLocalInvocationIndex, align 8
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%cmpz16.i = icmp eq i64 %7, 0
br i1 %cmpz16.i, label %leader.i, label %merge.i
leader.i: ; preds = %entry
call void @llvm.memcpy.p3.p0.i64(ptr addrspace(3) noundef align 16 dereferenceable(32) @ArgShadow.21, ptr noundef nonnull align 8 dereferenceable(32) %agg.tmp67, i64 32, i1 false)
br label %merge.i
merge.i: ; preds = %leader.i, %entry
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call void @llvm.memcpy.p0.p3.i64(ptr noundef nonnull align 8 dereferenceable(32) %agg.tmp67, ptr addrspace(3) noundef align 16 dereferenceable(32) @ArgShadow.21, i64 32, i1 false)
tail call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz16.i, label %wg_leader.i, label %wg_cf.i
wg_leader.i: ; preds = %merge.i
%g.ascast.i = addrspacecast ptr %agg.tmp67 to ptr addrspace(4)
store ptr addrspace(4) %g.ascast.i, ptr addrspace(3) @GAsCast5, align 8
store i32 0, ptr addrspace(3) @GCnt5, align 4
br label %wg_cf.i
wg_cf.i: ; preds = %wg_leader.i, %merge.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%wg_val_g.ascast.i = load ptr addrspace(4), ptr addrspace(3) @GAsCast5, align 8
%8 = load i64, ptr addrspace(1) @__spirv_BuiltInLocalInvocationId, align 32
%9 = trunc i64 %4 to i32
br label %for.cond.i
for.cond.i: ; preds = %wg_cf12.i, %wg_cf.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz16.i, label %wg_leader5.i, label %wg_cf6.i
wg_leader5.i: ; preds = %for.cond.i
%10 = load i32, ptr addrspace(3) @GCnt5, align 4
%cmp.i = icmp slt i32 %10, 2
store i1 %cmp.i, ptr addrspace(3) @GCmp5, align 1
br label %wg_cf6.i
wg_cf6.i: ; preds = %wg_leader5.i, %for.cond.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%wg_val_cmp.i = load i1, ptr addrspace(3) @GCmp5, align 1
br i1 %wg_val_cmp.i, label %for.body.i, label %lexit20
for.body.i: ; preds = %wg_cf6.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz16.i, label %TestMat.i, label %LeaderMat.i
TestMat.i: ; preds = %for.body.i
store ptr addrspace(4) %wg_val_g.ascast.i, ptr addrspace(3) @WGCopy.20.0, align 8
store ptr addrspace(4) addrspacecast (ptr addrspace(3) @GKernel4 to ptr addrspace(4)), ptr addrspace(3) @WGCopy.20.1, align 8
store i64 5, ptr addrspace(3) @WGCopy.19.0, align 8
br label %LeaderMat.i
LeaderMat.i: ; preds = %TestMat.i, %for.body.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
%11 = load i64, ptr addrspace(3) @WGCopy.19.0, align 8
%agg.tmp2.i.sroa.0.0.copyload = load ptr addrspace(4), ptr addrspace(3) @WGCopy.20.0, align 8
%agg.tmp2.i.sroa.6.0.copyload = load ptr addrspace(4), ptr addrspace(3) @WGCopy.20.1, align 8
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
%index.i.i.i.i.i = getelementptr inbounds i8, ptr addrspace(4) %agg.tmp2.i.sroa.0.0.copyload, i64 24
%12 = getelementptr inbounds i8, ptr addrspace(4) %agg.tmp2.i.sroa.6.0.copyload, i64 24
%13 = trunc i64 %11 to i32
br label %for.cond.i.i
for.cond.i.i: ; preds = %for.body.i.i, %LeaderMat.i
%storemerge.i.i = phi i64 [ %8, %LeaderMat.i ], [ %add.i.i, %for.body.i.i ]
%cmp.i.i = icmp ult i64 %storemerge.i.i, %11
br i1 %cmp.i.i, label %for.body.i.i, label %lexit21
for.body.i.i: ; preds = %for.cond.i.i
%14 = load i64, ptr addrspace(4) %index.i.i.i.i.i, align 8
%mul.i.i.i.i = mul i64 %14, 10
%mul3.i.i.i.i = shl i64 %storemerge.i.i, 1
%add.i.i.i.i = add i64 %mul.i.i.i.i, %mul3.i.i.i.i
%15 = load ptr addrspace(1), ptr addrspace(4) %12, align 8
%arrayidx.i.i.i.i.i = getelementptr inbounds i32, ptr addrspace(1) %15, i64 %add.i.i.i.i
%16 = load i32, ptr addrspace(1) %arrayidx.i.i.i.i.i, align 4
%conv9.i.i.i.i = add i32 %16, %13
store i32 %conv9.i.i.i.i, ptr addrspace(1) %arrayidx.i.i.i.i.i, align 4
%add14.i.i.i.i = or disjoint i64 %add.i.i.i.i, 1
%17 = load ptr addrspace(1), ptr addrspace(4) %12, align 8
%arrayidx.i25.i.i.i.i = getelementptr inbounds i32, ptr addrspace(1) %17, i64 %add14.i.i.i.i
%18 = load i32, ptr addrspace(1) %arrayidx.i25.i.i.i.i, align 4
%conv18.i.i.i.i = add i32 %18, %9
store i32 %conv18.i.i.i.i, ptr addrspace(1) %arrayidx.i25.i.i.i.i, align 4
%add.i.i = add i64 %storemerge.i.i, %4
br label %for.cond.i.i
lexit21: ; preds = %for.cond.i.i
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 noundef 2, i32 noundef 2, i32 noundef 272)
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br i1 %cmpz16.i, label %wg_leader11.i, label %wg_cf12.i
wg_leader11.i: ; preds = %lexit21
%19 = load i32, ptr addrspace(3) @GCnt5, align 4
%inc.i = add nsw i32 %19, 1
store i32 %inc.i, ptr addrspace(3) @GCnt5, align 4
br label %wg_cf12.i
wg_cf12.i: ; preds = %wg_leader11.i, %lexit21
call spir_func void @_Z22__spirv_ControlBarrierjjj(i32 2, i32 2, i32 272)
br label %for.cond.i
lexit20: ; preds = %wg_cf6.i
call void @llvm.lifetime.end.p0(i64 32, ptr nonnull %agg.tmp67)
ret void
}