| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py |
| ; RUN: opt -loop-idiom < %s -S | FileCheck %s |
| |
| %struct.S = type { i32, i32, i8 } |
| |
| ; unsigned copy_noalias(S* __restrict a, S *b, int n) { |
| ; for (int i = 0; i < n; i++) { |
| ; a[i] = b[i]; |
| ; } |
| ; return sizeof(a[0]); |
| ; } |
| |
| ; Positive test: the destination %a is marked noalias and every iteration |
| ; copies one 12-byte %struct.S element from %b[i] to %a[i]. |
| ; The assertions below expect -loop-idiom to emit a single memcpy of |
| ; zext(%n) * 12 bytes (align 4) in for.body.preheader and to remove the |
| ; per-iteration memcpy call from for.body. |
| ; Function Attrs: nofree nounwind uwtable mustprogress |
| define dso_local i32 @copy_noalias(%struct.S* noalias nocapture %a, %struct.S* nocapture readonly %b, i32 %n) local_unnamed_addr #0 { |
| ; CHECK-LABEL: @copy_noalias( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: [[A1:%.*]] = bitcast %struct.S* [[A:%.*]] to i8* |
| ; CHECK-NEXT: [[B2:%.*]] = bitcast %struct.S* [[B:%.*]] to i8* |
| ; CHECK-NEXT: [[CMP7:%.*]] = icmp sgt i32 [[N:%.*]], 0 |
| ; CHECK-NEXT: br i1 [[CMP7]], label [[FOR_BODY_PREHEADER:%.*]], label [[FOR_COND_CLEANUP:%.*]] |
| ; CHECK: for.body.preheader: |
| ; CHECK-NEXT: [[TMP0:%.*]] = zext i32 [[N]] to i64 |
| ; CHECK-NEXT: [[TMP1:%.*]] = mul nuw nsw i64 [[TMP0]], 12 |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 4 [[A1]], i8* align 4 [[B2]], i64 [[TMP1]], i1 false) |
| ; CHECK-NEXT: br label [[FOR_BODY:%.*]] |
| ; CHECK: for.cond.cleanup.loopexit: |
| ; CHECK-NEXT: br label [[FOR_COND_CLEANUP]] |
| ; CHECK: for.cond.cleanup: |
| ; CHECK-NEXT: ret i32 12 |
| ; CHECK: for.body: |
| ; CHECK-NEXT: [[I_08:%.*]] = phi i32 [ [[INC:%.*]], [[FOR_BODY]] ], [ 0, [[FOR_BODY_PREHEADER]] ] |
| ; CHECK-NEXT: [[IDXPROM:%.*]] = zext i32 [[I_08]] to i64 |
| ; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds [[STRUCT_S:%.*]], %struct.S* [[B]], i64 [[IDXPROM]] |
| ; CHECK-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds [[STRUCT_S]], %struct.S* [[A]], i64 [[IDXPROM]] |
| ; CHECK-NEXT: [[TMP2:%.*]] = bitcast %struct.S* [[ARRAYIDX2]] to i8* |
| ; CHECK-NEXT: [[TMP3:%.*]] = bitcast %struct.S* [[ARRAYIDX]] to i8* |
| ; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[I_08]], 1 |
| ; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[INC]], [[N]] |
| ; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY]], label [[FOR_COND_CLEANUP_LOOPEXIT:%.*]] |
| ; |
| entry: |
| ; Guard: the loop is skipped entirely when %n <= 0. |
| %cmp7 = icmp sgt i32 %n, 0 |
| br i1 %cmp7, label %for.body.preheader, label %for.cond.cleanup |
| |
| for.body.preheader: ; preds = %entry |
| br label %for.body |
| |
| for.cond.cleanup.loopexit: ; preds = %for.body |
| br label %for.cond.cleanup |
| |
| for.cond.cleanup: ; preds = %for.cond.cleanup.loopexit, %entry |
| ret i32 12 |
| |
| for.body: ; preds = %for.body.preheader, %for.body |
| %i.08 = phi i32 [ %inc, %for.body ], [ 0, %for.body.preheader ] |
| %idxprom = zext i32 %i.08 to i64 |
| %arrayidx = getelementptr inbounds %struct.S, %struct.S* %b, i64 %idxprom |
| %arrayidx2 = getelementptr inbounds %struct.S, %struct.S* %a, i64 %idxprom |
| %0 = bitcast %struct.S* %arrayidx2 to i8* |
| %1 = bitcast %struct.S* %arrayidx to i8* |
| ; Element copy a[i] = b[i] (12 bytes); this is the call the pass is expected to fold away. |
| call void @llvm.memcpy.p0i8.p0i8.i64(i8* nonnull align 4 dereferenceable(12) %0, i8* nonnull align 4 dereferenceable(12) %1, i64 12, i1 false) |
| %inc = add nuw nsw i32 %i.08, 1 |
| %cmp = icmp slt i32 %inc, %n |
| br i1 %cmp, label %for.body, label %for.cond.cleanup.loopexit |
| } |
| |
| ; unsigned copy_may_alias(S *a, S *b, int n) { |
| ; for (int i = 0; i < n; i++) { |
| ; a[i] = b[i]; |
| ; } |
| ; return sizeof(a[0]); |
| ; } |
| |
| ; Negative test: same loop as above, but neither %a nor %b carries noalias. |
| ; The assertions below expect the function to come out unchanged: the |
| ; 12-byte memcpy stays inside for.body and for.body.preheader contains only |
| ; the branch into the loop. |
| ; Function Attrs: nofree nounwind uwtable mustprogress |
| define dso_local i32 @copy_may_alias(%struct.S* nocapture %a, %struct.S* nocapture readonly %b, i32 %n) local_unnamed_addr #0 { |
| ; CHECK-LABEL: @copy_may_alias( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: [[CMP7:%.*]] = icmp sgt i32 [[N:%.*]], 0 |
| ; CHECK-NEXT: br i1 [[CMP7]], label [[FOR_BODY_PREHEADER:%.*]], label [[FOR_COND_CLEANUP:%.*]] |
| ; CHECK: for.body.preheader: |
| ; CHECK-NEXT: br label [[FOR_BODY:%.*]] |
| ; CHECK: for.cond.cleanup.loopexit: |
| ; CHECK-NEXT: br label [[FOR_COND_CLEANUP]] |
| ; CHECK: for.cond.cleanup: |
| ; CHECK-NEXT: ret i32 12 |
| ; CHECK: for.body: |
| ; CHECK-NEXT: [[I_08:%.*]] = phi i32 [ [[INC:%.*]], [[FOR_BODY]] ], [ 0, [[FOR_BODY_PREHEADER]] ] |
| ; CHECK-NEXT: [[IDXPROM:%.*]] = zext i32 [[I_08]] to i64 |
| ; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds [[STRUCT_S:%.*]], %struct.S* [[B:%.*]], i64 [[IDXPROM]] |
| ; CHECK-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds [[STRUCT_S]], %struct.S* [[A:%.*]], i64 [[IDXPROM]] |
| ; CHECK-NEXT: [[TMP0:%.*]] = bitcast %struct.S* [[ARRAYIDX2]] to i8* |
| ; CHECK-NEXT: [[TMP1:%.*]] = bitcast %struct.S* [[ARRAYIDX]] to i8* |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* nonnull align 4 dereferenceable(12) [[TMP0]], i8* nonnull align 4 dereferenceable(12) [[TMP1]], i64 12, i1 false) |
| ; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[I_08]], 1 |
| ; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[INC]], [[N]] |
| ; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY]], label [[FOR_COND_CLEANUP_LOOPEXIT:%.*]] |
| ; |
| entry: |
| ; Guard: the loop is skipped entirely when %n <= 0. |
| %cmp7 = icmp sgt i32 %n, 0 |
| br i1 %cmp7, label %for.body.preheader, label %for.cond.cleanup |
| |
| for.body.preheader: ; preds = %entry |
| br label %for.body |
| |
| for.cond.cleanup.loopexit: ; preds = %for.body |
| br label %for.cond.cleanup |
| |
| for.cond.cleanup: ; preds = %for.cond.cleanup.loopexit, %entry |
| ret i32 12 |
| |
| for.body: ; preds = %for.body.preheader, %for.body |
| %i.08 = phi i32 [ %inc, %for.body ], [ 0, %for.body.preheader ] |
| %idxprom = zext i32 %i.08 to i64 |
| %arrayidx = getelementptr inbounds %struct.S, %struct.S* %b, i64 %idxprom |
| %arrayidx2 = getelementptr inbounds %struct.S, %struct.S* %a, i64 %idxprom |
| %0 = bitcast %struct.S* %arrayidx2 to i8* |
| %1 = bitcast %struct.S* %arrayidx to i8* |
| ; Element copy a[i] = b[i] (12 bytes); expected to remain in the loop in this test. |
| call void @llvm.memcpy.p0i8.p0i8.i64(i8* nonnull align 4 dereferenceable(12) %0, i8* nonnull align 4 dereferenceable(12) %1, i64 12, i1 false) |
| %inc = add nuw nsw i32 %i.08, 1 |
| %cmp = icmp slt i32 %inc, %n |
| br i1 %cmp, label %for.body, label %for.cond.cleanup.loopexit |
| } |
| |
| %struct.R = type <{ i8, i32, i8 }> |
| |
| ; void copy_noalias_read(R* __restrict x, R* __restrict y, int n, int &s) { |
| ; for (int i = 0; i < n; i++) { |
| ; x[i] = y[i]; |
| ; s += y[i].b; |
| ; } |
| ; } |
| |
| ; Positive test with an extra read of the source: both %x and %y are |
| ; noalias, each iteration copies one 6-byte packed %struct.R element and |
| ; additionally loads field 1 of %y[i], accumulating it into the value |
| ; promoted from %s. |
| ; The assertions below expect the copy to become one memcpy of |
| ; zext(%n) * 6 bytes (align 1) in for.body.lr.ph, while the load and add |
| ; stay in for.body. |
| ; Function Attrs: nofree nounwind uwtable mustprogress |
| define dso_local void @copy_noalias_read(%struct.R* noalias nocapture %x, %struct.R* noalias nocapture readonly %y, i32 %n, i32* nocapture nonnull align 4 dereferenceable(4) %s) local_unnamed_addr #0 { |
| ; CHECK-LABEL: @copy_noalias_read( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: [[X1:%.*]] = bitcast %struct.R* [[X:%.*]] to i8* |
| ; CHECK-NEXT: [[Y2:%.*]] = bitcast %struct.R* [[Y:%.*]] to i8* |
| ; CHECK-NEXT: [[CMP11:%.*]] = icmp sgt i32 [[N:%.*]], 0 |
| ; CHECK-NEXT: br i1 [[CMP11]], label [[FOR_BODY_LR_PH:%.*]], label [[FOR_COND_CLEANUP:%.*]] |
| ; CHECK: for.body.lr.ph: |
| ; CHECK-NEXT: [[S_PROMOTED:%.*]] = load i32, i32* [[S:%.*]], align 4 |
| ; CHECK-NEXT: [[TMP0:%.*]] = zext i32 [[N]] to i64 |
| ; CHECK-NEXT: [[TMP1:%.*]] = mul nuw nsw i64 [[TMP0]], 6 |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 1 [[X1]], i8* align 1 [[Y2]], i64 [[TMP1]], i1 false) |
| ; CHECK-NEXT: br label [[FOR_BODY:%.*]] |
| ; CHECK: for.cond.for.cond.cleanup_crit_edge: |
| ; CHECK-NEXT: [[ADD_LCSSA:%.*]] = phi i32 [ [[ADD:%.*]], [[FOR_BODY]] ] |
| ; CHECK-NEXT: store i32 [[ADD_LCSSA]], i32* [[S]], align 4 |
| ; CHECK-NEXT: br label [[FOR_COND_CLEANUP]] |
| ; CHECK: for.cond.cleanup: |
| ; CHECK-NEXT: ret void |
| ; CHECK: for.body: |
| ; CHECK-NEXT: [[ADD13:%.*]] = phi i32 [ [[S_PROMOTED]], [[FOR_BODY_LR_PH]] ], [ [[ADD]], [[FOR_BODY]] ] |
| ; CHECK-NEXT: [[I_012:%.*]] = phi i32 [ 0, [[FOR_BODY_LR_PH]] ], [ [[INC:%.*]], [[FOR_BODY]] ] |
| ; CHECK-NEXT: [[IDXPROM:%.*]] = zext i32 [[I_012]] to i64 |
| ; CHECK-NEXT: [[TMP2:%.*]] = getelementptr inbounds [[STRUCT_R:%.*]], %struct.R* [[X]], i64 [[IDXPROM]], i32 0 |
| ; CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds [[STRUCT_R]], %struct.R* [[Y]], i64 [[IDXPROM]], i32 0 |
| ; CHECK-NEXT: [[B:%.*]] = getelementptr inbounds [[STRUCT_R]], %struct.R* [[Y]], i64 [[IDXPROM]], i32 1 |
| ; CHECK-NEXT: [[TMP4:%.*]] = load i32, i32* [[B]], align 1 |
| ; CHECK-NEXT: [[ADD]] = add nsw i32 [[ADD13]], [[TMP4]] |
| ; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[I_012]], 1 |
| ; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[INC]], [[N]] |
| ; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY]], label [[FOR_COND_FOR_COND_CLEANUP_CRIT_EDGE:%.*]] |
| ; |
| entry: |
| ; Guard: the loop is skipped entirely when %n <= 0. |
| %cmp11 = icmp sgt i32 %n, 0 |
| br i1 %cmp11, label %for.body.lr.ph, label %for.cond.cleanup |
| |
| for.body.lr.ph: ; preds = %entry |
| ; The accumulator is read from %s once here and written back once on loop exit. |
| %s.promoted = load i32, i32* %s, align 4 |
| br label %for.body |
| |
| for.cond.for.cond.cleanup_crit_edge: ; preds = %for.body |
| %add.lcssa = phi i32 [ %add, %for.body ] |
| store i32 %add.lcssa, i32* %s, align 4 |
| br label %for.cond.cleanup |
| |
| for.cond.cleanup: ; preds = %for.cond.for.cond.cleanup_crit_edge, %entry |
| ret void |
| |
| for.body: ; preds = %for.body.lr.ph, %for.body |
| %add13 = phi i32 [ %s.promoted, %for.body.lr.ph ], [ %add, %for.body ] |
| %i.012 = phi i32 [ 0, %for.body.lr.ph ], [ %inc, %for.body ] |
| %idxprom = zext i32 %i.012 to i64 |
| ; Field 0 of %struct.R is an i8, so these GEPs yield the i8* element addresses passed to memcpy. |
| %0 = getelementptr inbounds %struct.R, %struct.R* %x, i64 %idxprom, i32 0 |
| %1 = getelementptr inbounds %struct.R, %struct.R* %y, i64 %idxprom, i32 0 |
| ; Element copy x[i] = y[i] (6 bytes); this is the call the pass is expected to fold away. |
| call void @llvm.memcpy.p0i8.p0i8.i64(i8* nonnull align 1 dereferenceable(6) %0, i8* nonnull align 1 dereferenceable(6) %1, i64 6, i1 false) |
| ; Additional read of the copy source inside the same loop (s += y[i].b). |
| %b = getelementptr inbounds %struct.R, %struct.R* %y, i64 %idxprom, i32 1 |
| %2 = load i32, i32* %b, align 1 |
| %add = add nsw i32 %add13, %2 |
| %inc = add nuw nsw i32 %i.012, 1 |
| %cmp = icmp slt i32 %inc, %n |
| br i1 %cmp, label %for.body, label %for.cond.for.cond.cleanup_crit_edge |
| } |
| |
| ; unsigned copy_noalias_negative_stride(S* __restrict__ a, S* b, int n) { |
| ; for (int i = n; i >= 0; i--) { |
| ; a[i] = b[i]; |
| ; } |
| ; return sizeof(a[0]); |
| ; } |
| |
| ; Positive test with a down-counting index: the destination %0 is noalias |
| ; and the index starts at %2 and decrements until it reaches 0, so the loop |
| ; body runs %2 + 1 times when entered. |
| ; The assertions below expect a single memcpy of zext(%2) * 12 + 12 bytes |
| ; (align 4) from the base of %1 to the base of %0, placed in the block that |
| ; branches into the loop, with the per-iteration call removed. |
| ; Function Attrs: nofree nosync nounwind uwtable mustprogress |
| define dso_local i32 @copy_noalias_negative_stride(%struct.S* noalias nocapture %0, %struct.S* nocapture readonly %1, i32 %2) local_unnamed_addr #0 { |
| ; CHECK-LABEL: @copy_noalias_negative_stride( |
| ; CHECK-NEXT: [[TMP4:%.*]] = bitcast %struct.S* [[TMP0:%.*]] to i8* |
| ; CHECK-NEXT: [[TMP5:%.*]] = bitcast %struct.S* [[TMP1:%.*]] to i8* |
| ; CHECK-NEXT: [[TMP6:%.*]] = icmp sgt i32 [[TMP2:%.*]], -1 |
| ; CHECK-NEXT: br i1 [[TMP6]], label [[TMP7:%.*]], label [[TMP12:%.*]] |
| ; CHECK: 7: |
| ; CHECK-NEXT: [[TMP8:%.*]] = zext i32 [[TMP2]] to i64 |
| ; CHECK-NEXT: [[TMP9:%.*]] = mul nuw nsw i64 [[TMP8]], 12 |
| ; CHECK-NEXT: [[TMP10:%.*]] = add nuw nsw i64 [[TMP9]], 12 |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 4 [[TMP4]], i8* align 4 [[TMP5]], i64 [[TMP10]], i1 false) |
| ; CHECK-NEXT: br label [[TMP13:%.*]] |
| ; CHECK: 11: |
| ; CHECK-NEXT: br label [[TMP12]] |
| ; CHECK: 12: |
| ; CHECK-NEXT: ret i32 12 |
| ; CHECK: 13: |
| ; CHECK-NEXT: [[TMP14:%.*]] = phi i32 [ [[TMP20:%.*]], [[TMP13]] ], [ [[TMP2]], [[TMP7]] ] |
| ; CHECK-NEXT: [[TMP15:%.*]] = zext i32 [[TMP14]] to i64 |
| ; CHECK-NEXT: [[TMP16:%.*]] = getelementptr inbounds [[STRUCT_S:%.*]], %struct.S* [[TMP1]], i64 [[TMP15]] |
| ; CHECK-NEXT: [[TMP17:%.*]] = getelementptr inbounds [[STRUCT_S]], %struct.S* [[TMP0]], i64 [[TMP15]] |
| ; CHECK-NEXT: [[TMP18:%.*]] = bitcast %struct.S* [[TMP17]] to i8* |
| ; CHECK-NEXT: [[TMP19:%.*]] = bitcast %struct.S* [[TMP16]] to i8* |
| ; CHECK-NEXT: [[TMP20]] = add nsw i32 [[TMP14]], -1 |
| ; CHECK-NEXT: [[TMP21:%.*]] = icmp sgt i32 [[TMP14]], 0 |
| ; CHECK-NEXT: br i1 [[TMP21]], label [[TMP13]], label [[TMP11:%.*]] |
| ; |
| ; Guard: the loop is entered only when %2 >= 0. |
| %4 = icmp sgt i32 %2, -1 |
| br i1 %4, label %5, label %7 |
| |
| 5: ; preds = %3 |
| br label %8 |
| |
| 6: ; preds = %8 |
| br label %7 |
| |
| 7: ; preds = %6, %3 |
| ret i32 12 |
| |
| 8: ; preds = %5, %8 |
| ; %9 is the down-counting index i, initialised to %2. |
| %9 = phi i32 [ %15, %8 ], [ %2, %5 ] |
| %10 = zext i32 %9 to i64 |
| %11 = getelementptr inbounds %struct.S, %struct.S* %1, i64 %10 |
| %12 = getelementptr inbounds %struct.S, %struct.S* %0, i64 %10 |
| %13 = bitcast %struct.S* %12 to i8* |
| %14 = bitcast %struct.S* %11 to i8* |
| ; Element copy a[i] = b[i] (12 bytes); this is the call the pass is expected to fold away. |
| tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* noundef nonnull align 4 dereferenceable(12) %13, i8* noundef nonnull align 4 dereferenceable(12) %14, i64 12, i1 false) |
| %15 = add nsw i32 %9, -1 |
| ; Continue while the index just processed was > 0, i.e. the next index is still >= 0. |
| %16 = icmp sgt i32 %9, 0 |
| br i1 %16, label %8, label %6 |
| } |
| |
| ; unsigned copy_noalias_opposite_stride(S* __restrict__ a, S* b, int n) { |
| ; for (int i = 0, j = n; i < n && j >= 0; i++, j--) { |
| ; a[i] = b[j]; |
| ; } |
| ; return sizeof(a[0]); |
| ; } |
| |
| ; Negative test: the destination index counts up from 0 while the source |
| ; index counts down from %2, so the two accesses move in opposite |
| ; directions. |
| ; The assertions below expect the function to come out unchanged, with the |
| ; 12-byte memcpy still inside the loop body. |
| ; Function Attrs: nofree nosync nounwind uwtable mustprogress |
| define dso_local i32 @copy_noalias_opposite_stride(%struct.S* noalias nocapture %0, %struct.S* nocapture readonly %1, i32 %2) local_unnamed_addr #0 { |
| ; CHECK-LABEL: @copy_noalias_opposite_stride( |
| ; CHECK-NEXT: [[TMP4:%.*]] = icmp sgt i32 [[TMP2:%.*]], 0 |
| ; CHECK-NEXT: br i1 [[TMP4]], label [[TMP5:%.*]], label [[TMP7:%.*]] |
| ; CHECK: 5: |
| ; CHECK-NEXT: br label [[TMP8:%.*]] |
| ; CHECK: 6: |
| ; CHECK-NEXT: br label [[TMP7]] |
| ; CHECK: 7: |
| ; CHECK-NEXT: ret i32 12 |
| ; CHECK: 8: |
| ; CHECK-NEXT: [[TMP9:%.*]] = phi i32 [ [[TMP18:%.*]], [[TMP8]] ], [ [[TMP2]], [[TMP5]] ] |
| ; CHECK-NEXT: [[TMP10:%.*]] = phi i32 [ [[TMP17:%.*]], [[TMP8]] ], [ 0, [[TMP5]] ] |
| ; CHECK-NEXT: [[TMP11:%.*]] = zext i32 [[TMP9]] to i64 |
| ; CHECK-NEXT: [[TMP12:%.*]] = getelementptr inbounds [[STRUCT_S:%.*]], %struct.S* [[TMP1:%.*]], i64 [[TMP11]] |
| ; CHECK-NEXT: [[TMP13:%.*]] = zext i32 [[TMP10]] to i64 |
| ; CHECK-NEXT: [[TMP14:%.*]] = getelementptr inbounds [[STRUCT_S]], %struct.S* [[TMP0:%.*]], i64 [[TMP13]] |
| ; CHECK-NEXT: [[TMP15:%.*]] = bitcast %struct.S* [[TMP14]] to i8* |
| ; CHECK-NEXT: [[TMP16:%.*]] = bitcast %struct.S* [[TMP12]] to i8* |
| ; CHECK-NEXT: tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* noundef nonnull align 4 dereferenceable(12) [[TMP15]], i8* noundef nonnull align 4 dereferenceable(12) [[TMP16]], i64 12, i1 false) |
| ; CHECK-NEXT: [[TMP17]] = add nuw nsw i32 [[TMP10]], 1 |
| ; CHECK-NEXT: [[TMP18]] = add nsw i32 [[TMP9]], -1 |
| ; CHECK-NEXT: [[TMP19:%.*]] = icmp slt i32 [[TMP17]], [[TMP2]] |
| ; CHECK-NEXT: [[TMP20:%.*]] = icmp sgt i32 [[TMP9]], 0 |
| ; CHECK-NEXT: [[TMP21:%.*]] = and i1 [[TMP19]], [[TMP20]] |
| ; CHECK-NEXT: br i1 [[TMP21]], label [[TMP8]], label [[TMP6:%.*]] |
| ; |
| ; Guard: the loop is skipped entirely when %2 <= 0. |
| %4 = icmp sgt i32 %2, 0 |
| br i1 %4, label %5, label %7 |
| |
| 5: ; preds = %3 |
| br label %8 |
| |
| 6: ; preds = %8 |
| br label %7 |
| |
| 7: ; preds = %6, %3 |
| ret i32 12 |
| |
| 8: ; preds = %5, %8 |
| ; %9 is the source index j (starts at %2, decrements); %10 is the destination index i (starts at 0, increments). |
| %9 = phi i32 [ %18, %8 ], [ %2, %5 ] |
| %10 = phi i32 [ %17, %8 ], [ 0, %5 ] |
| %11 = zext i32 %9 to i64 |
| %12 = getelementptr inbounds %struct.S, %struct.S* %1, i64 %11 |
| %13 = zext i32 %10 to i64 |
| %14 = getelementptr inbounds %struct.S, %struct.S* %0, i64 %13 |
| %15 = bitcast %struct.S* %14 to i8* |
| %16 = bitcast %struct.S* %12 to i8* |
| ; Element copy a[i] = b[j] (12 bytes); expected to remain in the loop in this test. |
| tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* noundef nonnull align 4 dereferenceable(12) %15, i8* noundef nonnull align 4 dereferenceable(12) %16, i64 12, i1 false) |
| %17 = add nuw nsw i32 %10, 1 |
| %18 = add nsw i32 %9, -1 |
| ; Loop continues only while both conditions hold: next i < %2 and current j > 0. |
| %19 = icmp slt i32 %17, %2 |
| %20 = icmp sgt i32 %9, 0 |
| %21 = and i1 %19, %20 |
| br i1 %21, label %8, label %6 |
| } |
| |
| %struct.SPacked = type <{ i32, i32, i8 }> |
| |
| ; Positive test over the packed %struct.SPacked: the destination %a is |
| ; noalias and each iteration copies one 9-byte element with align 1. |
| ; The assertions below expect a single memcpy of zext(%n) * 9 bytes |
| ; (align 1) in for.body.preheader, with the per-iteration call removed |
| ; from for.body. |
| ; Function Attrs: nofree nounwind uwtable mustprogress |
| define dso_local i32 @copy_noalias_packed(%struct.SPacked* noalias nocapture %a, %struct.SPacked* nocapture readonly %b, i32 %n) local_unnamed_addr #0 { |
| ; CHECK-LABEL: @copy_noalias_packed( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: [[A1:%.*]] = bitcast %struct.SPacked* [[A:%.*]] to i8* |
| ; CHECK-NEXT: [[B2:%.*]] = bitcast %struct.SPacked* [[B:%.*]] to i8* |
| ; CHECK-NEXT: [[CMP7:%.*]] = icmp sgt i32 [[N:%.*]], 0 |
| ; CHECK-NEXT: br i1 [[CMP7]], label [[FOR_BODY_PREHEADER:%.*]], label [[FOR_COND_CLEANUP:%.*]] |
| ; CHECK: for.body.preheader: |
| ; CHECK-NEXT: [[TMP0:%.*]] = zext i32 [[N]] to i64 |
| ; CHECK-NEXT: [[TMP1:%.*]] = mul nuw nsw i64 [[TMP0]], 9 |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 1 [[A1]], i8* align 1 [[B2]], i64 [[TMP1]], i1 false) |
| ; CHECK-NEXT: br label [[FOR_BODY:%.*]] |
| ; CHECK: for.cond.cleanup.loopexit: |
| ; CHECK-NEXT: br label [[FOR_COND_CLEANUP]] |
| ; CHECK: for.cond.cleanup: |
| ; CHECK-NEXT: ret i32 9 |
| ; CHECK: for.body: |
| ; CHECK-NEXT: [[I_08:%.*]] = phi i32 [ [[INC:%.*]], [[FOR_BODY]] ], [ 0, [[FOR_BODY_PREHEADER]] ] |
| ; CHECK-NEXT: [[IDXPROM:%.*]] = zext i32 [[I_08]] to i64 |
| ; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds [[STRUCT_SPACKED:%.*]], %struct.SPacked* [[B]], i64 [[IDXPROM]] |
| ; CHECK-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds [[STRUCT_SPACKED]], %struct.SPacked* [[A]], i64 [[IDXPROM]] |
| ; CHECK-NEXT: [[TMP2:%.*]] = bitcast %struct.SPacked* [[ARRAYIDX2]] to i8* |
| ; CHECK-NEXT: [[TMP3:%.*]] = bitcast %struct.SPacked* [[ARRAYIDX]] to i8* |
| ; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[I_08]], 1 |
| ; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[INC]], [[N]] |
| ; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY]], label [[FOR_COND_CLEANUP_LOOPEXIT:%.*]] |
| ; |
| entry: |
| ; Guard: the loop is skipped entirely when %n <= 0. |
| %cmp7 = icmp sgt i32 %n, 0 |
| br i1 %cmp7, label %for.body.preheader, label %for.cond.cleanup |
| |
| for.body.preheader: ; preds = %entry |
| br label %for.body |
| |
| for.cond.cleanup.loopexit: ; preds = %for.body |
| br label %for.cond.cleanup |
| |
| for.cond.cleanup: ; preds = %for.cond.cleanup.loopexit, %entry |
| ret i32 9 |
| |
| for.body: ; preds = %for.body.preheader, %for.body |
| %i.08 = phi i32 [ %inc, %for.body ], [ 0, %for.body.preheader ] |
| %idxprom = zext i32 %i.08 to i64 |
| %arrayidx = getelementptr inbounds %struct.SPacked, %struct.SPacked* %b, i64 %idxprom |
| %arrayidx2 = getelementptr inbounds %struct.SPacked, %struct.SPacked* %a, i64 %idxprom |
| %0 = bitcast %struct.SPacked* %arrayidx2 to i8* |
| %1 = bitcast %struct.SPacked* %arrayidx to i8* |
| ; Element copy a[i] = b[i] (9 bytes, align 1); this is the call the pass is expected to fold away. |
| call void @llvm.memcpy.p0i8.p0i8.i64(i8* nonnull align 1 dereferenceable(9) %0, i8* nonnull align 1 dereferenceable(9) %1, i64 9, i1 false) |
| %inc = add nuw nsw i32 %i.08, 1 |
| %cmp = icmp slt i32 %inc, %n |
| br i1 %cmp, label %for.body, label %for.cond.cleanup.loopexit |
| } |
| |
| %struct.SAligned = type { i32, i32, i8, [7 x i8] } |
| |
| ; Positive test over %struct.SAligned: the destination %a is noalias and |
| ; each iteration copies one 16-byte element with align 16. |
| ; The assertions below expect a single memcpy of zext(%n) << 4 bytes |
| ; (align 16) in for.body.preheader, with the per-iteration call removed |
| ; from for.body. |
| define dso_local i32 @copy_noalias_aligned(%struct.SAligned* noalias nocapture %a, %struct.SAligned* nocapture readonly %b, i32 %n) local_unnamed_addr #0 { |
| ; CHECK-LABEL: @copy_noalias_aligned( |
| ; CHECK-NEXT: entry: |
| ; CHECK-NEXT: [[A1:%.*]] = bitcast %struct.SAligned* [[A:%.*]] to i8* |
| ; CHECK-NEXT: [[B2:%.*]] = bitcast %struct.SAligned* [[B:%.*]] to i8* |
| ; CHECK-NEXT: [[CMP7:%.*]] = icmp sgt i32 [[N:%.*]], 0 |
| ; CHECK-NEXT: br i1 [[CMP7]], label [[FOR_BODY_PREHEADER:%.*]], label [[FOR_COND_CLEANUP:%.*]] |
| ; CHECK: for.body.preheader: |
| ; CHECK-NEXT: [[TMP0:%.*]] = zext i32 [[N]] to i64 |
| ; CHECK-NEXT: [[TMP1:%.*]] = shl nuw nsw i64 [[TMP0]], 4 |
| ; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 16 [[A1]], i8* align 16 [[B2]], i64 [[TMP1]], i1 false) |
| ; CHECK-NEXT: br label [[FOR_BODY:%.*]] |
| ; CHECK: for.cond.cleanup.loopexit: |
| ; CHECK-NEXT: br label [[FOR_COND_CLEANUP]] |
| ; CHECK: for.cond.cleanup: |
| ; CHECK-NEXT: ret i32 16 |
| ; CHECK: for.body: |
| ; CHECK-NEXT: [[I_08:%.*]] = phi i32 [ [[INC:%.*]], [[FOR_BODY]] ], [ 0, [[FOR_BODY_PREHEADER]] ] |
| ; CHECK-NEXT: [[IDXPROM:%.*]] = zext i32 [[I_08]] to i64 |
| ; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds [[STRUCT_SALIGNED:%.*]], %struct.SAligned* [[B]], i64 [[IDXPROM]] |
| ; CHECK-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds [[STRUCT_SALIGNED]], %struct.SAligned* [[A]], i64 [[IDXPROM]] |
| ; CHECK-NEXT: [[TMP2:%.*]] = bitcast %struct.SAligned* [[ARRAYIDX2]] to i8* |
| ; CHECK-NEXT: [[TMP3:%.*]] = bitcast %struct.SAligned* [[ARRAYIDX]] to i8* |
| ; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[I_08]], 1 |
| ; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[INC]], [[N]] |
| ; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY]], label [[FOR_COND_CLEANUP_LOOPEXIT:%.*]] |
| ; |
| entry: |
| ; Guard: the loop is skipped entirely when %n <= 0. |
| %cmp7 = icmp sgt i32 %n, 0 |
| br i1 %cmp7, label %for.body.preheader, label %for.cond.cleanup |
| |
| for.body.preheader: ; preds = %entry |
| br label %for.body |
| |
| for.cond.cleanup.loopexit: ; preds = %for.body |
| br label %for.cond.cleanup |
| |
| for.cond.cleanup: ; preds = %for.cond.cleanup.loopexit, %entry |
| ret i32 16 |
| |
| for.body: ; preds = %for.body.preheader, %for.body |
| %i.08 = phi i32 [ %inc, %for.body ], [ 0, %for.body.preheader ] |
| %idxprom = zext i32 %i.08 to i64 |
| %arrayidx = getelementptr inbounds %struct.SAligned, %struct.SAligned* %b, i64 %idxprom |
| %arrayidx2 = getelementptr inbounds %struct.SAligned, %struct.SAligned* %a, i64 %idxprom |
| %0 = bitcast %struct.SAligned* %arrayidx2 to i8* |
| %1 = bitcast %struct.SAligned* %arrayidx to i8* |
| ; Element copy a[i] = b[i] (16 bytes, align 16); this is the call the pass is expected to fold away. |
| call void @llvm.memcpy.p0i8.p0i8.i64(i8* nonnull align 16 dereferenceable(16) %0, i8* nonnull align 16 dereferenceable(16) %1, i64 16, i1 false) |
| %inc = add nuw nsw i32 %i.08, 1 |
| %cmp = icmp slt i32 %inc, %n |
| br i1 %cmp, label %for.body, label %for.cond.cleanup.loopexit |
| } |
| |
| ; Declaration of the memcpy intrinsic called by every loop body in this file. |
| ; Operands, per the LLVM Language Reference: destination pointer, source |
| ; pointer, byte count, and an immediate is-volatile flag (always false here). |
| ; Function Attrs: argmemonly nofree nosync nounwind willreturn |
| declare void @llvm.memcpy.p0i8.p0i8.i64(i8* noalias nocapture writeonly, i8* noalias nocapture readonly, i64, i1 immarg) #1 |