| ; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \ |
| ; RUN: -mcpu=pwr10 -ppc-asm-full-reg-names < %s \ |
| ; RUN: | FileCheck %s --check-prefixes=CHECK-S,CHECK-ALL |
| ; RUN: llc -verify-machineinstrs -target-abi=elfv2 -mtriple=powerpc64-- \ |
| ; RUN: -mcpu=pwr10 -ppc-asm-full-reg-names < %s \ |
| ; RUN: | FileCheck %s --check-prefixes=CHECK-S,CHECK-ALL |
| ; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \ |
| ; RUN: -mcpu=pwr9 -ppc-asm-full-reg-names < %s \ |
| ; RUN: | FileCheck %s --check-prefixes=CHECK-P9,CHECK-ALL |
| ; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \ |
| ; RUN: -mcpu=pwr9 --code-model=large -ppc-asm-full-reg-names < %s \ |
| ; RUN: | FileCheck %s --check-prefixes=CHECK-LARGE,CHECK-ALL |
| |
| @global_int = common dso_local local_unnamed_addr global i32 0, align 4 |
| |
| define dso_local signext i32 @NoTOC() local_unnamed_addr { |
| ; CHECK-ALL-LABEL: NoTOC: |
| ; CHECK-S-NOT: .localentry |
| ; CHECK-S: li r3, 42 |
| ; CHECK-S-NEXT: blr |
| entry: |
| ret i32 42 |
| } |
| |
| define dso_local signext i32 @AsmClobberX2(i32 signext %a, i32 signext %b) local_unnamed_addr { |
| ; CHECK-ALL-LABEL: AsmClobberX2: |
| ; CHECK-S: .localentry AsmClobberX2, 1 |
| ; CHECK-S: add r3, r4, r3 |
| ; CHECK-S: #APP |
| ; CHECK-S-NEXT: nop |
| ; CHECK-S-NEXT: #NO_APP |
| ; CHECK-S: blr |
| entry: |
| %add = add nsw i32 %b, %a |
| tail call void asm sideeffect "nop", "~{r2}"() |
| ret i32 %add |
| } |
| |
| ; FIXME: This is actually a test case that shows a bug. On power9 and earlier |
| ; this test should not compile. On later CPUs (like this test) the @toc |
| ; should be replaced with @pcrel and we won't need R2 and so the problem |
| ; goes away. |
| define dso_local signext i32 @AsmClobberX2WithTOC(i32 signext %a, i32 signext %b) local_unnamed_addr { |
| ; CHECK-ALL-LABEL: AsmClobberX2WithTOC: |
| ; CHECK-LARGE: ld r2, .Lfunc_toc2-.Lfunc_gep2(r12) |
| ; CHECK-LARGE: add r2, r2, r12 |
| ; CHECK-S: .localentry AsmClobberX2WithTOC |
| ; CHECK-S: #APP |
| ; CHECK-S-NEXT: li r2, 0 |
| ; CHECK-S-NEXT: #NO_APP |
| ; CHECK-S-NEXT: plwz r5, global_int@PCREL(0), 1 |
| ; CHECK-S-NEXT: add r3, r4, r3 |
| ; CHECK-S-NEXT: add r3, r3, r5 |
| ; CHECK-S-NEXT: extsw r3, r3 |
| ; CHECK-S-NEXT: blr |
| entry: |
| %add = add nsw i32 %b, %a |
| tail call void asm sideeffect "li 2, 0", "~{r2}"() |
| %0 = load i32, ptr @global_int, align 4 |
| %add1 = add nsw i32 %add, %0 |
| ret i32 %add1 |
| } |
| |
| define dso_local signext i32 @AsmClobberX5(i32 signext %a, i32 signext %b) local_unnamed_addr { |
| ; CHECK-ALL-LABEL: AsmClobberX5: |
| ; CHECK-S: .localentry AsmClobberX5, 1 |
| ; CHECK-P9-NOT: .localentry |
| ; CHECK-ALL: # %bb.0: # %entry |
| ; CHECK-S-NEXT: add r3, r4, r3 |
| ; CHECK-S-NEXT: #APP |
| ; CHECK-S-NEXT: nop |
| ; CHECK-S-NEXT: #NO_APP |
| ; CHECK-S-NEXT: extsw r3, r3 |
| ; CHECK-S-NEXT: blr |
| entry: |
| %add = add nsw i32 %b, %a |
| tail call void asm sideeffect "nop", "~{r5}"() |
| ret i32 %add |
| } |
| |
| ; Clobber all GPRs except R2. |
| define dso_local signext i32 @AsmClobberNotR2(i32 signext %a, i32 signext %b) local_unnamed_addr { |
| ; CHECK-ALL-LABEL: AsmClobberNotR2: |
| ; CHECK-S: .localentry AsmClobberNotR2, 1 |
| ; CHECK-P9-NOT: .localentry |
| ; CHECK-S: add r3, r4, r3 |
| ; CHECK-S: stw r3, -148(r1) # 4-byte Folded Spill |
| ; CHECK-S-NEXT: #APP |
| ; CHECK-S-NEXT: nop |
| ; CHECK-S-NEXT: #NO_APP |
| ; CHECK-S-NEXT: lwz r3, -148(r1) # 4-byte Folded Reload |
| ; CHECK-S: blr |
| entry: |
| %add = add nsw i32 %b, %a |
| tail call void asm sideeffect "nop", "~{r0},~{r1},~{r3},~{r4},~{r5},~{r6},~{r7},~{r8},~{r9},~{r10},~{r11},~{r12},~{r13},~{r14},~{r15},~{r16},~{r17},~{r18},~{r19},~{r20},~{r21},~{r22},~{r23},~{r24},~{r25},~{r26},~{r27},~{r28},~{r29},~{r30},~{r31}"() |
| ret i32 %add |
| } |
| |
| ; Increase register pressure enough to force the register allocator to |
| ; make use of R2. |
| define dso_local signext i32 @X2IsCallerSaved(i32 signext %a, i32 signext %b, i32 signext %c, i32 signext %d, i32 signext %e, i32 signext %f, i32 signext %g, i32 signext %h) local_unnamed_addr { |
| ; CHECK-ALL-LABEL: X2IsCallerSaved: |
| ; CHECK-S: .localentry X2IsCallerSaved, 1 |
| ; CHECK-P9-NOT: .localentry |
| ; CHECK-ALL: # %bb.0: # %entry |
| ; CHECK-S-NEXT: std r29, -24(r1) # 8-byte Folded Spill |
| ; CHECK-S-NEXT: std r30, -16(r1) # 8-byte Folded Spill |
| ; CHECK-S-NEXT: add r11, r4, r3 |
| ; CHECK-S-NEXT: sub r29, r8, r9 |
| ; CHECK-S-NEXT: add r9, r10, r9 |
| ; CHECK-S-NEXT: sub r10, r10, r3 |
| ; CHECK-S-NEXT: mullw r3, r4, r3 |
| ; CHECK-S-NEXT: sub r12, r4, r5 |
| ; CHECK-S-NEXT: add r0, r6, r5 |
| ; CHECK-S-NEXT: sub r2, r6, r7 |
| ; CHECK-S-NEXT: add r30, r8, r7 |
| ; CHECK-S-NEXT: mullw r3, r3, r11 |
| ; CHECK-S-NEXT: mullw r3, r3, r5 |
| ; CHECK-S-NEXT: mullw r3, r3, r6 |
| ; CHECK-S-NEXT: mullw r3, r3, r12 |
| ; CHECK-S-NEXT: mullw r3, r3, r0 |
| ; CHECK-S-NEXT: mullw r3, r3, r7 |
| ; CHECK-S-NEXT: mullw r3, r3, r8 |
| ; CHECK-S-NEXT: mullw r3, r3, r2 |
| ; CHECK-S-NEXT: mullw r3, r3, r30 |
| ; CHECK-S-NEXT: ld r30, -16(r1) # 8-byte Folded Reload |
| ; CHECK-S-NEXT: mullw r3, r3, r29 |
| ; CHECK-S-NEXT: ld r29, -24(r1) # 8-byte Folded Reload |
| ; CHECK-S-NEXT: mullw r3, r3, r9 |
| ; CHECK-S-NEXT: mullw r3, r3, r10 |
| ; CHECK-S-NEXT: extsw r3, r3 |
| ; CHECK-S-NEXT: blr |
| entry: |
| %add = add nsw i32 %b, %a |
| %sub = sub nsw i32 %b, %c |
| %add1 = add nsw i32 %d, %c |
| %sub2 = sub nsw i32 %d, %e |
| %add3 = add nsw i32 %f, %e |
| %sub4 = sub nsw i32 %f, %g |
| %add5 = add nsw i32 %h, %g |
| %sub6 = sub nsw i32 %h, %a |
| %mul = mul i32 %b, %a |
| %mul7 = mul i32 %mul, %add |
| %mul8 = mul i32 %mul7, %c |
| %mul9 = mul i32 %mul8, %d |
| %mul10 = mul i32 %mul9, %sub |
| %mul11 = mul i32 %mul10, %add1 |
| %mul12 = mul i32 %mul11, %e |
| %mul13 = mul i32 %mul12, %f |
| %mul14 = mul i32 %mul13, %sub2 |
| %mul15 = mul i32 %mul14, %add3 |
| %mul16 = mul i32 %mul15, %sub4 |
| %mul17 = mul i32 %mul16, %add5 |
| %mul18 = mul i32 %mul17, %sub6 |
| ret i32 %mul18 |
| } |
| |
| |
| define dso_local signext i32 @UsesX2AsTOC() local_unnamed_addr { |
| ; CHECK-ALL-LABEL: UsesX2AsTOC: |
| ; CHECK-LARGE: ld r2, .Lfunc_toc6-.Lfunc_gep6(r12) |
| ; CHECK-LARGE: add r2, r2, r12 |
| ; CHECK-ALL: # %bb.0: # %entry |
| entry: |
| %0 = load i32, ptr @global_int, align 4 |
| ret i32 %0 |
| } |
| |
| |
| define dso_local double @UsesX2AsConstPoolTOC() local_unnamed_addr { |
| ; CHECK-ALL-LABEL: UsesX2AsConstPoolTOC: |
| ; CHECK-LARGE: ld r2, .Lfunc_toc7-.Lfunc_gep7(r12) |
| ; CHECK-LARGE: add r2, r2, r12 |
| ; CHECK-S-NOT: .localentry |
| ; CHECK-ALL: # %bb.0: # %entry |
| ; CHECK-S-NEXT: xxsplti32dx vs1, 0, 1078011044 |
| ; CHECK-S-NEXT: xxsplti32dx vs1, 1, -337824948 |
| ; CHECK-S-NEXT: blr |
| entry: |
| ret double 0x404124A4EBDD334C |
| } |
| |
| |