; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \
; RUN:   -mcpu=pwr10 -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | \
; RUN:   FileCheck %s
; RUN: llc -verify-machineinstrs -target-abi=elfv2 -mtriple=powerpc64-- \
; RUN:   -mcpu=pwr10 -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | \
; RUN:   FileCheck %s

; The tests check the behaviour of PC Relative tail calls. When using
; PC Relative we are able to do more tail calling than we have done in
; the past as we no longer need to restore the TOC pointer into R2 after
; most calls.

; Function-pointer globals: @Func is defined externally, while @FuncLocal is
; a dso_local common definition initialised to null.
@Func = external local_unnamed_addr global i32 (...)*, align 8
@FuncLocal = common dso_local local_unnamed_addr global i32 (...)* null, align 8

; No calls in this function but we assign the function pointers.
; The address of @Function is stored into both globals. The expected code
; reaches @Func and @Function through GOT-indirect pc-relative loads
; (pld ...@got@pcrel) and writes @FuncLocal with a direct pc-relative pstd.
define dso_local void @AssignFuncPtr() local_unnamed_addr {
; CHECK-LABEL: AssignFuncPtr:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    pld r3, Func@got@pcrel(0), 1
; CHECK-NEXT:    pld r4, Function@got@pcrel(0), 1
; CHECK-NEXT:    std r4, 0(r3)
; CHECK-NEXT:    pstd r4, FuncLocal@PCREL(0), 1
; CHECK-NEXT:    blr
entry:
  store i32 (...)* @Function, i32 (...)** @Func, align 8
  store i32 (...)* @Function, i32 (...)** @FuncLocal, align 8
  ret void
}

; External variadic callee used as the target of the direct-call tests.
declare signext i32 @Function(...)
; Tail call through the pointer stored in the dso_local global @FuncLocal.
; The pointer is expected to be loaded pc-relative straight into r12 and the
; call to be a non-linking bctr.
define dso_local void @TailCallLocalFuncPtr() local_unnamed_addr {
; CHECK-LABEL: TailCallLocalFuncPtr:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    pld r12, FuncLocal@PCREL(0), 1
; CHECK-NEXT:    mtctr r12
; CHECK-NEXT:    bctr
; CHECK-NEXT:    #TC_RETURNr8 ctr 0
entry:
  %0 = load i32 ()*, i32 ()** bitcast (i32 (...)** @FuncLocal to i32 ()**), align 8
  %call = tail call signext i32 %0()
  ret void
}

; Tail call through the pointer stored in the external global @Func.
; The address of @Func is expected to come from the GOT, with an
; R_PPC64_PCREL_OPT relocation emitted between the pld and the ld that
; consumes its result.
define dso_local void @TailCallExtrnFuncPtr() local_unnamed_addr {
; CHECK-LABEL: TailCallExtrnFuncPtr:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    pld r3, Func@got@pcrel(0), 1
; CHECK-NEXT:  .Lpcrel0:
; CHECK-NEXT:    .reloc .Lpcrel0-8,R_PPC64_PCREL_OPT,.-(.Lpcrel0-8)
; CHECK-NEXT:    ld r12, 0(r3)
; CHECK-NEXT:    mtctr r12
; CHECK-NEXT:    bctr
; CHECK-NEXT:    #TC_RETURNr8 ctr 0
entry:
  %0 = load i32 ()*, i32 ()** bitcast (i32 (...)** @Func to i32 ()**), align 8
  %call = tail call signext i32 %0()
  ret void
}

; Tail call through a function pointer received as the first parameter
; (r3 in the expected output); the result is returned unchanged.
define dso_local signext i32 @TailCallParamFuncPtr(i32 (...)* nocapture %passedfunc) local_unnamed_addr {
; CHECK-LABEL: TailCallParamFuncPtr:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    mtctr r3
; CHECK-NEXT:    mr r12, r3
; CHECK-NEXT:    bctr
; CHECK-NEXT:    #TC_RETURNr8 ctr 0
entry:
  %callee.knr.cast = bitcast i32 (...)* %passedfunc to i32 ()*
  %call = tail call signext i32 %callee.knr.cast()
  ret i32 %call
}

; Indirect call whose result is added to %a before returning. The expected
; output is a linking call (bctrl) inside a full stack frame, with %a kept
; live across the call in r30.
define dso_local signext i32 @NoTailIndirectCall(i32 (...)* nocapture %passedfunc, i32 signext %a) local_unnamed_addr {
; CHECK-LABEL: NoTailIndirectCall:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    mflr r0
; CHECK-NEXT:    .cfi_def_cfa_offset 48
; CHECK-NEXT:    .cfi_offset lr, 16
; CHECK-NEXT:    .cfi_offset r30, -16
; CHECK-NEXT:    std r30, -16(r1) # 8-byte Folded Spill
; CHECK-NEXT:    std r0, 16(r1)
; CHECK-NEXT:    stdu r1, -48(r1)
; CHECK-NEXT:    mr r12, r3
; CHECK-NEXT:    mtctr r3
; CHECK-NEXT:    mr r30, r4
; CHECK-NEXT:    bctrl
; CHECK-NEXT:    add r3, r3, r30
; CHECK-NEXT:    extsw r3, r3
; CHECK-NEXT:    addi r1, r1, 48
; CHECK-NEXT:    ld r0, 16(r1)
; CHECK-NEXT:    ld r30, -16(r1) # 8-byte Folded Reload
; CHECK-NEXT:    mtlr r0
; CHECK-NEXT:    blr
entry:
  %callee.knr.cast = bitcast i32 (...)* %passedfunc to i32 ()*
  %call = tail call signext i32 %callee.knr.cast()
  %add = add nsw i32 %call, %a
  ret i32 %add
}

; Direct tail call to the external @Function; expected to be a plain branch
; to Function@notoc.
define dso_local signext i32 @TailCallDirect() local_unnamed_addr {
; CHECK-LABEL: TailCallDirect:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    b Function@notoc
; CHECK-NEXT:    #TC_RETURNd8 Function@notoc 0
entry:
  %call = tail call signext i32 bitcast (i32 (...)* @Function to i32 ()*)()
  ret i32 %call
}

; Direct call to @Function whose result is added to %a before returning.
; The expected output is a linking call (bl) inside a full stack frame.
define dso_local signext i32 @NoTailCallDirect(i32 signext %a) local_unnamed_addr {
; CHECK-LABEL: NoTailCallDirect:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    mflr r0
; CHECK-NEXT:    .cfi_def_cfa_offset 48
; CHECK-NEXT:    .cfi_offset lr, 16
; CHECK-NEXT:    .cfi_offset r30, -16
; CHECK-NEXT:    std r30, -16(r1) # 8-byte Folded Spill
; CHECK-NEXT:    std r0, 16(r1)
; CHECK-NEXT:    stdu r1, -48(r1)
; CHECK-NEXT:    mr r30, r3
; CHECK-NEXT:    bl Function@notoc
; CHECK-NEXT:    add r3, r3, r30
; CHECK-NEXT:    extsw r3, r3
; CHECK-NEXT:    addi r1, r1, 48
; CHECK-NEXT:    ld r0, 16(r1)
; CHECK-NEXT:    ld r30, -16(r1) # 8-byte Folded Reload
; CHECK-NEXT:    mtlr r0
; CHECK-NEXT:    blr
entry:
  %call = tail call signext i32 bitcast (i32 (...)* @Function to i32 ()*)()
  %add = add nsw i32 %call, %a
  ret i32 %add
}

; Direct tail call to the internal fastcc @LocalFunction; expected to be a
; plain branch to LocalFunction@notoc.
define dso_local signext i32 @TailCallDirectLocal() local_unnamed_addr {
; CHECK-LABEL: TailCallDirectLocal:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    b LocalFunction@notoc
; CHECK-NEXT:    #TC_RETURNd8 LocalFunction@notoc 0
entry:
  %call = tail call fastcc signext i32 @LocalFunction()
  ret i32 %call
}

; Direct call to @LocalFunction whose result is added to %a before
; returning. The expected output is a linking call (bl) inside a full stack
; frame.
define dso_local signext i32 @NoTailCallDirectLocal(i32 signext %a) local_unnamed_addr {
; CHECK-LABEL: NoTailCallDirectLocal:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    mflr r0
; CHECK-NEXT:    .cfi_def_cfa_offset 48
; CHECK-NEXT:    .cfi_offset lr, 16
; CHECK-NEXT:    .cfi_offset r30, -16
; CHECK-NEXT:    std r30, -16(r1) # 8-byte Folded Spill
; CHECK-NEXT:    std r0, 16(r1)
; CHECK-NEXT:    stdu r1, -48(r1)
; CHECK-NEXT:    mr r30, r3
; CHECK-NEXT:    bl LocalFunction@notoc
; CHECK-NEXT:    add r3, r3, r30
; CHECK-NEXT:    extsw r3, r3
; CHECK-NEXT:    addi r1, r1, 48
; CHECK-NEXT:    ld r0, 16(r1)
; CHECK-NEXT:    ld r30, -16(r1) # 8-byte Folded Reload
; CHECK-NEXT:    mtlr r0
; CHECK-NEXT:    blr
entry:
  %call = tail call fastcc signext i32 @LocalFunction()
  %add = add nsw i32 %call, %a
  ret i32 %add
}

; Tail call to the absolute address 400 (inttoptr constant). The address is
; expected to be materialised with li and the call to be a non-linking bctr.
define dso_local signext i32 @TailCallAbs() local_unnamed_addr {
; CHECK-LABEL: TailCallAbs:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    li r3, 400
; CHECK-NEXT:    li r12, 400
; CHECK-NEXT:    mtctr r3
; CHECK-NEXT:    bctr
; CHECK-NEXT:    #TC_RETURNr8 ctr 0
entry:
  %call = tail call signext i32 inttoptr (i64 400 to i32 ()*)()
  ret i32 %call
}

; Call to the absolute address 400 whose result is added to %a before
; returning. The expected output is a linking call (bctrl) inside a full
; stack frame.
define dso_local signext i32 @NoTailCallAbs(i32 signext %a) local_unnamed_addr {
; CHECK-LABEL: NoTailCallAbs:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    mflr r0
; CHECK-NEXT:    .cfi_def_cfa_offset 48
; CHECK-NEXT:    .cfi_offset lr, 16
; CHECK-NEXT:    .cfi_offset r30, -16
; CHECK-NEXT:    std r30, -16(r1) # 8-byte Folded Spill
; CHECK-NEXT:    std r0, 16(r1)
; CHECK-NEXT:    stdu r1, -48(r1)
; CHECK-NEXT:    mr r30, r3
; CHECK-NEXT:    li r3, 400
; CHECK-NEXT:    li r12, 400
; CHECK-NEXT:    mtctr r3
; CHECK-NEXT:    bctrl
; CHECK-NEXT:    add r3, r3, r30
; CHECK-NEXT:    extsw r3, r3
; CHECK-NEXT:    addi r1, r1, 48
; CHECK-NEXT:    ld r0, 16(r1)
; CHECK-NEXT:    ld r30, -16(r1) # 8-byte Folded Reload
; CHECK-NEXT:    mtlr r0
; CHECK-NEXT:    blr
entry:
  %call = tail call signext i32 inttoptr (i64 400 to i32 ()*)()
  %add = add nsw i32 %call, %a
  ret i32 %add
}

; Function Attrs: noinline
; This function should be tail called and not inlined.
; The body is an inline-asm `li` of the constant 42 into the result register.
define internal fastcc signext i32 @LocalFunction() unnamed_addr #0 {
; CHECK-LABEL: LocalFunction:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    #APP
; CHECK-NEXT:    li r3, 42
; CHECK-NEXT:    #NO_APP
; CHECK-NEXT:    extsw r3, r3
; CHECK-NEXT:    blr
entry:
  %0 = tail call i32 asm "li $0, 42", "=&r"()
  ret i32 %0
}

attributes #0 = { noinline }