| ; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \ |
| ; RUN: -enable-ppc-quad-precision -verify-machineinstrs < %s | FileCheck %s |
| ; RUN: llc -mcpu=pwr9 -mtriple=powerpc64-unknown-unknown \ |
| ; RUN: -enable-ppc-quad-precision -verify-machineinstrs < %s \ |
| ; RUN: | FileCheck -check-prefix=CHECK-BE %s |
| |
| ; Testing homogeneous aggregates. |
| |
| %struct.With9fp128params = type { fp128, fp128, fp128, fp128, fp128, fp128, |
| fp128, fp128, fp128 } |
| |
| @a1 = common local_unnamed_addr global [3 x fp128] zeroinitializer, align 16 |
| |
| ; Function Attrs: norecurse nounwind readonly |
| define fp128 @testArray_01(fp128* nocapture readonly %sa) { |
| ; CHECK-LABEL: testArray_01: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: lxv 34, 32(3) |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testArray_01: |
| ; CHECK-BE: lxv 34, 32(3) |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %arrayidx = getelementptr inbounds fp128, fp128* %sa, i64 2 |
| %0 = load fp128, fp128* %arrayidx, align 16 |
| ret fp128 %0 |
| } |
| |
| ; Function Attrs: norecurse nounwind readonly |
| define fp128 @testArray_02() { |
| ; CHECK-LABEL: testArray_02: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: addis 3, 2, .LC0@toc@ha |
| ; CHECK-NEXT: ld 3, .LC0@toc@l(3) |
| ; CHECK-NEXT: lxv 34, 32(3) |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testArray_02: |
| ; CHECK-BE: lxv 34, 32(3) |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %0 = load fp128, fp128* getelementptr inbounds ([3 x fp128], [3 x fp128]* @a1, |
| i64 0, i64 2), align 16 |
| ret fp128 %0 |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testStruct_01(fp128 inreg returned %a.coerce) { |
| ; CHECK-LABEL: testStruct_01: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testStruct_01: |
| ; CHECK-BE: # %bb.0: # %entry |
| ; CHECK-BE-NEXT: blr |
| entry: |
| ret fp128 %a.coerce |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testStruct_02([8 x fp128] %a.coerce) { |
| ; CHECK-LABEL: testStruct_02: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: vmr 2, 9 |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testStruct_02: |
| ; CHECK-BE: vmr 2, 9 |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a.coerce.fca.7.extract = extractvalue [8 x fp128] %a.coerce, 7 |
| ret fp128 %a.coerce.fca.7.extract |
| } |
| |
| ; Since we can only pass a max of 8 float128 value in VSX registers, ensure we |
| ; store to stack if passing more. |
| ; Function Attrs: norecurse nounwind readonly |
| define fp128 @testStruct_03(%struct.With9fp128params* byval nocapture readonly |
| align 16 %a) { |
| ; CHECK-LABEL: testStruct_03: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: lxv 34, 128(1) |
| ; CHECK-NEXT: std 10, 88(1) |
| ; CHECK-NEXT: std 9, 80(1) |
| ; CHECK-NEXT: std 8, 72(1) |
| ; CHECK-NEXT: std 7, 64(1) |
| ; CHECK-NEXT: std 6, 56(1) |
| ; CHECK-NEXT: std 5, 48(1) |
| ; CHECK-NEXT: std 4, 40(1) |
| ; CHECK-NEXT: std 3, 32(1) |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testStruct_03: |
| ; CHECK-BE: # %bb.0: # %entry |
| ; CHECK-BE-NEXT: lxv 34, 144(1) |
| ; CHECK-BE-NEXT: std 10, 104(1) |
| ; CHECK-BE-NEXT: std 9, 96(1) |
| ; CHECK-BE-NEXT: std 8, 88(1) |
| ; CHECK-BE-NEXT: std 7, 80(1) |
| ; CHECK-BE-NEXT: std 6, 72(1) |
| ; CHECK-BE-NEXT: std 5, 64(1) |
| ; CHECK-BE-NEXT: std 4, 56(1) |
| ; CHECK-BE-NEXT: std 3, 48(1) |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a7 = getelementptr inbounds %struct.With9fp128params, |
| %struct.With9fp128params* %a, i64 0, i32 6 |
| %0 = load fp128, fp128* %a7, align 16 |
| ret fp128 %0 |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testStruct_04([8 x fp128] %a.coerce) { |
| ; CHECK-LABEL: testStruct_04: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: vmr 2, 5 |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testStruct_04: |
| ; CHECK-BE: vmr 2, 5 |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a.coerce.fca.3.extract = extractvalue [8 x fp128] %a.coerce, 3 |
| ret fp128 %a.coerce.fca.3.extract |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testHUnion_01([1 x fp128] %a.coerce) { |
| ; CHECK-LABEL: testHUnion_01: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testHUnion_01: |
| ; CHECK-BE: # %bb.0: # %entry |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a.coerce.fca.0.extract = extractvalue [1 x fp128] %a.coerce, 0 |
| ret fp128 %a.coerce.fca.0.extract |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testHUnion_02([3 x fp128] %a.coerce) { |
| ; CHECK-LABEL: testHUnion_02: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testHUnion_02: |
| ; CHECK-BE: # %bb.0: # %entry |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a.coerce.fca.0.extract = extractvalue [3 x fp128] %a.coerce, 0 |
| ret fp128 %a.coerce.fca.0.extract |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testHUnion_03([3 x fp128] %a.coerce) { |
| ; CHECK-LABEL: testHUnion_03: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: vmr 2, 3 |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testHUnion_03: |
| ; CHECK-BE: # %bb.0: # %entry |
| ; CHECK-BE-NEXT: vmr 2, 3 |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a.coerce.fca.1.extract = extractvalue [3 x fp128] %a.coerce, 1 |
| ret fp128 %a.coerce.fca.1.extract |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testHUnion_04([3 x fp128] %a.coerce) { |
| ; CHECK-LABEL: testHUnion_04: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: vmr 2, 4 |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testHUnion_04: |
| ; CHECK-BE: # %bb.0: # %entry |
| ; CHECK-BE-NEXT: vmr 2, 4 |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a.coerce.fca.2.extract = extractvalue [3 x fp128] %a.coerce, 2 |
| ret fp128 %a.coerce.fca.2.extract |
| } |
| |
| ; Testing mixed member aggregates. |
| |
| %struct.MixedC = type { i32, %struct.SA, float, [12 x i8] } |
| %struct.SA = type { double, fp128, <4 x float> } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testMixedAggregate([3 x i128] %a.coerce) { |
| ; CHECK-LABEL: testMixedAggregate: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: mtvsrdd 34, 8, 7 |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testMixedAggregate: |
| ; CHECK-BE: mtvsrdd 34, 8, 7 |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a.coerce.fca.2.extract = extractvalue [3 x i128] %a.coerce, 2 |
| %0 = bitcast i128 %a.coerce.fca.2.extract to fp128 |
| ret fp128 %0 |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testMixedAggregate_02([4 x i128] %a.coerce) { |
| ; CHECK-LABEL: testMixedAggregate_02: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: mtvsrdd 34, 6, 5 |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testMixedAggregate_02: |
| ; CHECK-BE: mtvsrdd 34, 6, 5 |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a.coerce.fca.1.extract = extractvalue [4 x i128] %a.coerce, 1 |
| %0 = bitcast i128 %a.coerce.fca.1.extract to fp128 |
| ret fp128 %0 |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testMixedAggregate_03([4 x i128] %sa.coerce) { |
| ; CHECK-LABEL: testMixedAggregate_03: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-DAG: mtvsrwa 34, 3 |
| ; CHECK-DAG: mtvsrdd 35, 6, 5 |
| ; CHECK: mtvsrd 36, 10 |
| ; CHECK: xscvsdqp 2, 2 |
| ; CHECK-DAG: xscvsdqp [[REG:[0-9]+]], 4 |
| ; CHECK-DAG: xsaddqp 2, 3, 2 |
| ; CHECK: xsaddqp 2, 2, [[REG]] |
| ; CHECK-NEXT: blr |
| entry: |
| %sa.coerce.fca.0.extract = extractvalue [4 x i128] %sa.coerce, 0 |
| %sa.sroa.0.0.extract.trunc = trunc i128 %sa.coerce.fca.0.extract to i32 |
| %sa.coerce.fca.1.extract = extractvalue [4 x i128] %sa.coerce, 1 |
| %sa.coerce.fca.3.extract = extractvalue [4 x i128] %sa.coerce, 3 |
| %sa.sroa.6.48.extract.shift = lshr i128 %sa.coerce.fca.3.extract, 64 |
| %sa.sroa.6.48.extract.trunc = trunc i128 %sa.sroa.6.48.extract.shift to i64 |
| %conv = sitofp i32 %sa.sroa.0.0.extract.trunc to fp128 |
| %0 = bitcast i128 %sa.coerce.fca.1.extract to fp128 |
| %add = fadd fp128 %0, %conv |
| %conv2 = sitofp i64 %sa.sroa.6.48.extract.trunc to fp128 |
| %add3 = fadd fp128 %add, %conv2 |
| ret fp128 %add3 |
| } |
| |
| |
| ; Function Attrs: norecurse nounwind readonly |
| define fp128 @testNestedAggregate(%struct.MixedC* byval nocapture readonly align 16 %a) { |
| ; CHECK-LABEL: testNestedAggregate: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: std 8, 72(1) |
| ; CHECK-NEXT: std 7, 64(1) |
| ; CHECK-NEXT: std 10, 88(1) |
| ; CHECK-NEXT: std 9, 80(1) |
| ; CHECK-NEXT: lxv 34, 64(1) |
| ; CHECK-NEXT: std 6, 56(1) |
| ; CHECK-NEXT: std 5, 48(1) |
| ; CHECK-NEXT: std 4, 40(1) |
| ; CHECK-NEXT: std 3, 32(1) |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testNestedAggregate: |
| ; CHECK-BE: # %bb.0: # %entry |
| ; CHECK-BE-NEXT: std 8, 88(1) |
| ; CHECK-BE-NEXT: std 7, 80(1) |
| ; CHECK-BE-NEXT: std 10, 104(1) |
| ; CHECK-BE-NEXT: std 9, 96(1) |
| ; CHECK-BE-NEXT: lxv 34, 80(1) |
| ; CHECK-BE-NEXT: std 6, 72(1) |
| ; CHECK-BE-NEXT: std 5, 64(1) |
| ; CHECK-BE-NEXT: std 4, 56(1) |
| ; CHECK-BE-NEXT: std 3, 48(1) |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %c = getelementptr inbounds %struct.MixedC, %struct.MixedC* %a, i64 0, i32 1, i32 1 |
| %0 = load fp128, fp128* %c, align 16 |
| ret fp128 %0 |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testUnion_01([1 x i128] %a.coerce) { |
| ; CHECK-LABEL: testUnion_01: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: mtvsrdd 34, 4, 3 |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testUnion_01: |
| ; CHECK-BE: mtvsrdd 34, 4, 3 |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a.coerce.fca.0.extract = extractvalue [1 x i128] %a.coerce, 0 |
| %0 = bitcast i128 %a.coerce.fca.0.extract to fp128 |
| ret fp128 %0 |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testUnion_02([1 x i128] %a.coerce) { |
| ; CHECK-LABEL: testUnion_02: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: mtvsrdd 34, 4, 3 |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testUnion_02: |
| ; CHECK-BE: mtvsrdd 34, 4, 3 |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a.coerce.fca.0.extract = extractvalue [1 x i128] %a.coerce, 0 |
| %0 = bitcast i128 %a.coerce.fca.0.extract to fp128 |
| ret fp128 %0 |
| } |
| |
| ; Function Attrs: norecurse nounwind readnone |
| define fp128 @testUnion_03([4 x i128] %a.coerce) { |
| ; CHECK-LABEL: testUnion_03: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: mtvsrdd 34, 8, 7 |
| ; CHECK-NEXT: blr |
| |
| ; CHECK-BE-LABEL: testUnion_03: |
| ; CHECK-BE: mtvsrdd 34, 8, 7 |
| ; CHECK-BE-NEXT: blr |
| entry: |
| %a.coerce.fca.2.extract = extractvalue [4 x i128] %a.coerce, 2 |
| %0 = bitcast i128 %a.coerce.fca.2.extract to fp128 |
| ret fp128 %0 |
| } |
| |
| ; Function Attrs: nounwind |
| define fp128 @sum_float128(i32 signext %count, ...) { |
| ; CHECK-LABEL: sum_float128: |
| ; CHECK: # %bb.0: # %entry |
| ; CHECK-NEXT: addis 11, 2, .LCPI17_0@toc@ha |
| ; CHECK-NEXT: cmpwi 0, 3, 1 |
| ; CHECK-NEXT: std 10, 88(1) |
| ; CHECK-NEXT: std 9, 80(1) |
| ; CHECK-NEXT: std 8, 72(1) |
| ; CHECK-NEXT: std 7, 64(1) |
| ; CHECK-NEXT: std 6, 56(1) |
| ; CHECK-NEXT: std 5, 48(1) |
| ; CHECK-NEXT: std 4, 40(1) |
| ; CHECK-NEXT: addi 11, 11, .LCPI17_0@toc@l |
| ; CHECK-NEXT: lxvx 34, 0, 11 |
| ; CHECK-NEXT: bltlr 0 |
| ; CHECK-NEXT: # %bb.1: # %if.end |
| ; CHECK-NEXT: addi 3, 1, 40 |
| ; CHECK-NEXT: lxvx 35, 0, 3 |
| ; CHECK-NEXT: xsaddqp 2, 3, 2 |
| ; CHECK-NEXT: lxv 35, 16(3) |
| ; CHECK-NEXT: addi 3, 1, 72 |
| ; CHECK-NEXT: std 3, -8(1) |
| ; CHECK-NEXT: xsaddqp 2, 2, 3 |
| ; CHECK-NEXT: blr |
| entry: |
| %ap = alloca i8*, align 8 |
| %0 = bitcast i8** %ap to i8* |
| call void @llvm.lifetime.start.p0i8(i64 8, i8* nonnull %0) #2 |
| %cmp = icmp slt i32 %count, 1 |
| br i1 %cmp, label %cleanup, label %if.end |
| |
| if.end: ; preds = %entry |
| call void @llvm.va_start(i8* nonnull %0) |
| %argp.cur = load i8*, i8** %ap, align 8 |
| %argp.next = getelementptr inbounds i8, i8* %argp.cur, i64 16 |
| %1 = bitcast i8* %argp.cur to fp128* |
| %2 = load fp128, fp128* %1, align 8 |
| %add = fadd fp128 %2, 0xL00000000000000000000000000000000 |
| %argp.next3 = getelementptr inbounds i8, i8* %argp.cur, i64 32 |
| store i8* %argp.next3, i8** %ap, align 8 |
| %3 = bitcast i8* %argp.next to fp128* |
| %4 = load fp128, fp128* %3, align 8 |
| %add4 = fadd fp128 %add, %4 |
| call void @llvm.va_end(i8* nonnull %0) |
| br label %cleanup |
| |
| cleanup: ; preds = %entry, %if.end |
| %retval.0 = phi fp128 [ %add4, %if.end ], [ 0xL00000000000000000000000000000000, %entry ] |
| call void @llvm.lifetime.end.p0i8(i64 8, i8* nonnull %0) #2 |
| ret fp128 %retval.0 |
| } |
| |
| declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) #1 |
| declare void @llvm.va_start(i8*) #2 |
| declare void @llvm.va_end(i8*) #2 |
| declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) #1 |