mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2025-01-31 12:41:49 +01:00
[CodeGen] Enable tail call position check for speculatable functions
The function "isInTailCallPosition" in Analysis.cpp only checks whether a call is in a tail call position if the call has side effects, accesses memory, or is not safe to speculatively execute. As a result, a call to a speculatable function skips the tail call position check and can be improperly tail called even when it is not in a tail call position. This patch enables the tail call position check for speculatable functions as well. Differential Revision: https://reviews.llvm.org/D80661
This commit is contained in:
parent
070c26f0c5
commit
14cc6c217a
@ -530,24 +530,23 @@ bool llvm::isInTailCallPosition(const CallBase &Call, const TargetMachine &TM) {
|
||||
|
||||
// If I will have a chain, make sure no other instruction that will have a
|
||||
// chain interposes between I and the return.
|
||||
if (Call.mayHaveSideEffects() || Call.mayReadFromMemory() ||
|
||||
!isSafeToSpeculativelyExecute(&Call))
|
||||
for (BasicBlock::const_iterator BBI = std::prev(ExitBB->end(), 2);; --BBI) {
|
||||
if (&*BBI == &Call)
|
||||
break;
|
||||
// Debug info intrinsics do not get in the way of tail call optimization.
|
||||
if (isa<DbgInfoIntrinsic>(BBI))
|
||||
// Check for all calls including speculatable functions.
|
||||
for (BasicBlock::const_iterator BBI = std::prev(ExitBB->end(), 2);; --BBI) {
|
||||
if (&*BBI == &Call)
|
||||
break;
|
||||
// Debug info intrinsics do not get in the way of tail call optimization.
|
||||
if (isa<DbgInfoIntrinsic>(BBI))
|
||||
continue;
|
||||
// A lifetime end or assume intrinsic should not stop tail call
|
||||
// optimization.
|
||||
if (const IntrinsicInst *II = dyn_cast<IntrinsicInst>(BBI))
|
||||
if (II->getIntrinsicID() == Intrinsic::lifetime_end ||
|
||||
II->getIntrinsicID() == Intrinsic::assume)
|
||||
continue;
|
||||
// A lifetime end or assume intrinsic should not stop tail call
|
||||
// optimization.
|
||||
if (const IntrinsicInst *II = dyn_cast<IntrinsicInst>(BBI))
|
||||
if (II->getIntrinsicID() == Intrinsic::lifetime_end ||
|
||||
II->getIntrinsicID() == Intrinsic::assume)
|
||||
continue;
|
||||
if (BBI->mayHaveSideEffects() || BBI->mayReadFromMemory() ||
|
||||
!isSafeToSpeculativelyExecute(&*BBI))
|
||||
return false;
|
||||
}
|
||||
if (BBI->mayHaveSideEffects() || BBI->mayReadFromMemory() ||
|
||||
!isSafeToSpeculativelyExecute(&*BBI))
|
||||
return false;
|
||||
}
|
||||
|
||||
const Function *F = ExitBB->getParent();
|
||||
return returnTypeIsEligibleForTailCall(
|
||||
|
96
test/CodeGen/PowerPC/tailcall-speculatable-callee.ll
Normal file
96
test/CodeGen/PowerPC/tailcall-speculatable-callee.ll
Normal file
@ -0,0 +1,96 @@
|
||||
; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \
|
||||
; RUN: -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | FileCheck %s
|
||||
|
||||
; The tests check the behavior of the tail call decision when the callee is speculatable.
|
||||
|
||||
; Callee should be tail called in this function since it is at a tail call position.
|
||||
define dso_local double @speculatable_callee_return_use_only (double* nocapture %res, double %a) #0 {
|
||||
; CHECK-LABEL: speculatable_callee_return_use_only:
|
||||
; CHECK: # %bb.0: # %entry
|
||||
; CHECK-NEXT: b callee
|
||||
entry:
|
||||
%value = tail call double @callee(double %a) #2
|
||||
ret double %value
|
||||
}
|
||||
|
||||
; Callee should not be tail called: its result is stored to memory before the function returns void, so the call is not at a tail call position.
|
||||
define dso_local void @speculatable_callee_non_return_use_only (double* nocapture %res, double %a) #0 {
|
||||
; CHECK-LABEL: speculatable_callee_non_return_use_only:
|
||||
; CHECK: # %bb.0: # %entry
|
||||
; CHECK-NEXT: mflr r0
|
||||
; CHECK-NEXT: std r30, -16(r1) # 8-byte Folded Spill
|
||||
; CHECK-NEXT: std r0, 16(r1)
|
||||
; CHECK-NEXT: stdu r1, -48(r1)
|
||||
; CHECK-NEXT: mr r30, r3
|
||||
; CHECK-NEXT: bl callee
|
||||
; CHECK-NEXT: stfdx f1, 0, r30
|
||||
; CHECK-NEXT: addi r1, r1, 48
|
||||
; CHECK-NEXT: ld r0, 16(r1)
|
||||
; CHECK-NEXT: ld r30, -16(r1) # 8-byte Folded Reload
|
||||
; CHECK-NEXT: mtlr r0
|
||||
; CHECK-NEXT: blr
|
||||
entry:
|
||||
%call = tail call double @callee(double %a) #2
|
||||
store double %call, double* %res, align 8
|
||||
ret void
|
||||
}
|
||||
|
||||
; Callee should not be tail called: its result is stored to memory as well as returned, so the call is not at a tail call position.
|
||||
define dso_local double @speculatable_callee_multi_use (double* nocapture %res, double %a) #0 {
|
||||
; CHECK-LABEL: speculatable_callee_multi_use:
|
||||
; CHECK: # %bb.0: # %entry
|
||||
; CHECK-NEXT: mflr r0
|
||||
; CHECK-NEXT: std r30, -16(r1) # 8-byte Folded Spill
|
||||
; CHECK-NEXT: std r0, 16(r1)
|
||||
; CHECK-NEXT: stdu r1, -48(r1)
|
||||
; CHECK-NEXT: mr r30, r3
|
||||
; CHECK-NEXT: bl callee
|
||||
; CHECK-NEXT: stfdx f1, 0, r30
|
||||
; CHECK-NEXT: addi r1, r1, 48
|
||||
; CHECK-NEXT: ld r0, 16(r1)
|
||||
; CHECK-NEXT: ld r30, -16(r1) # 8-byte Folded Reload
|
||||
; CHECK-NEXT: mtlr r0
|
||||
; CHECK-NEXT: blr
|
||||
entry:
|
||||
%call = tail call double @callee(double %a) #2
|
||||
store double %call, double* %res, align 8
|
||||
ret double %call
|
||||
}
|
||||
|
||||
; Callee should not be tail called: an unrelated store sits between the call and the return, so the call is not at a tail call position.
|
||||
; FIXME: A speculatable callee can be tail called if it is moved into a valid tail call position.
|
||||
define dso_local double @speculatable_callee_intermediate_instructions (double* nocapture %res, double %a) #0 {
|
||||
; CHECK-LABEL: speculatable_callee_intermediate_instructions:
|
||||
; CHECK: # %bb.0: # %entry
|
||||
; CHECK-NEXT: mflr r0
|
||||
; CHECK-NEXT: std r30, -16(r1) # 8-byte Folded Spill
|
||||
; CHECK-NEXT: std r0, 16(r1)
|
||||
; CHECK-NEXT: stdu r1, -48(r1)
|
||||
; CHECK-NEXT: mr r30, r3
|
||||
; CHECK-NEXT: bl callee
|
||||
; CHECK-NEXT: lis r3, 16404
|
||||
; CHECK-NEXT: ori r3, r3, 52428
|
||||
; CHECK-NEXT: sldi r3, r3, 32
|
||||
; CHECK-NEXT: oris r3, r3, 52428
|
||||
; CHECK-NEXT: ori r3, r3, 52429
|
||||
; CHECK-NEXT: std r3, 0(r30)
|
||||
; CHECK-NEXT: addi r1, r1, 48
|
||||
; CHECK-NEXT: ld r0, 16(r1)
|
||||
; CHECK-NEXT: ld r30, -16(r1) # 8-byte Folded Reload
|
||||
; CHECK-NEXT: mtlr r0
|
||||
; CHECK-NEXT: blr
|
||||
|
||||
entry:
|
||||
%call = tail call double @callee(double %a) #2
|
||||
store double 5.2, double* %res, align 8
|
||||
ret double %call
|
||||
}
|
||||
|
||||
|
||||
define double @callee(double) #1 {
|
||||
ret double 4.5
|
||||
}
|
||||
|
||||
attributes #0 = { nounwind }
|
||||
attributes #1 = { readnone speculatable }
|
||||
attributes #2 = { nounwind noinline }
|
Loading…
x
Reference in New Issue
Block a user