; RUN: llc < %s -relocation-model=static -O1 -disable-ppc-sco=false -verify-machineinstrs -mtriple=powerpc64-unknown-linux-gnu | FileCheck %s -check-prefix=CHECK-SCO ; RUN: llc < %s -relocation-model=static -O1 -disable-ppc-sco=false -verify-machineinstrs -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr8 | FileCheck %s -check-prefix=CHECK-SCO-HASQPX ; RUN: llc < %s -relocation-model=static -O1 -disable-ppc-sco=false -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu -mcpu=pwr8 | FileCheck %s -check-prefix=CHECK-SCO-HASQPX ; RUN: llc < %s -relocation-model=static -O1 -disable-ppc-sco=false -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu -mcpu=pwr8 -code-model=small | FileCheck %s -check-prefix=SCM ; No combination of "powerpc64le-unknown-linux-gnu" + "CHECK-SCO", because ; only Power8 (and later) fully support LE. %S_56 = type { [13 x i32], i32 } %S_64 = type { [15 x i32], i32 } %S_32 = type { [7 x i32], i32 } ; Function Attrs: noinline nounwind define void @callee_56_copy([7 x i64] %a, %S_56* %b) #0 { ret void } define void @callee_64_copy([8 x i64] %a, %S_64* %b) #0 { ret void } ; Function Attrs: nounwind define void @caller_56_reorder_copy(%S_56* %b, [7 x i64] %a) #1 { tail call void @callee_56_copy([7 x i64] %a, %S_56* %b) ret void ; CHECK-SCO-LABEL: caller_56_reorder_copy: ; CHECK-SCO-NOT: stdu 1 ; CHECK-SCO: TC_RETURNd8 callee_56_copy } define void @caller_64_reorder_copy(%S_64* %b, [8 x i64] %a) #1 { tail call void @callee_64_copy([8 x i64] %a, %S_64* %b) ret void ; CHECK-SCO-LABEL: caller_64_reorder_copy: ; CHECK-SCO: bl callee_64_copy } define void @callee_64_64_copy([8 x i64] %a, [8 x i64] %b) #0 { ret void } define void @caller_64_64_copy([8 x i64] %a, [8 x i64] %b) #1 { tail call void @callee_64_64_copy([8 x i64] %a, [8 x i64] %b) ret void ; CHECK-SCO-LABEL: caller_64_64_copy: ; CHECK-SCO: b callee_64_64_copy } define internal fastcc void @callee_64_64_copy_fastcc([8 x i64] %a, [8 x i64] %b) #0 { ret void } define void @caller_64_64_copy_ccc([8 x i64] %a, [8 x i64] %b) #1 { tail call fastcc void @callee_64_64_copy_fastcc([8 x i64] %a, [8 x i64] %b) ret void ; If caller and callee use different calling convensions, we cannot apply TCO. ; CHECK-SCO-LABEL: caller_64_64_copy_ccc: ; CHECK-SCO: bl callee_64_64_copy_fastcc } define void @caller_64_64_reorder_copy([8 x i64] %a, [8 x i64] %b) #1 { tail call void @callee_64_64_copy([8 x i64] %b, [8 x i64] %a) ret void ; CHECK-SCO-LABEL: caller_64_64_reorder_copy: ; CHECK-SCO: bl callee_64_64_copy } define void @caller_64_64_undef_copy([8 x i64] %a, [8 x i64] %b) #1 { tail call void @callee_64_64_copy([8 x i64] %a, [8 x i64] undef) ret void ; CHECK-SCO-LABEL: caller_64_64_undef_copy: ; CHECK-SCO: b callee_64_64_copy } define void @arg8_callee( float %a, i32 signext %b, float %c, i32* %d, i8 zeroext %e, float %f, i32* %g, i32 signext %h) { ret void } define void @arg8_caller(float %a, i32 signext %b, i8 zeroext %c, i32* %d) { entry: tail call void @arg8_callee(float undef, i32 signext undef, float undef, i32* %d, i8 zeroext undef, float undef, i32* undef, i32 signext undef) ret void ; CHECK-SCO-LABEL: arg8_caller: ; CHECK-SCO: b arg8_callee } ; Struct return test ; Function Attrs: noinline nounwind define void @callee_sret_56(%S_56* noalias sret %agg.result) #0 { ret void } define void @callee_sret_32(%S_32* noalias sret %agg.result) #0 { ret void } ; Function Attrs: nounwind define void @caller_do_something_sret_32(%S_32* noalias sret %agg.result) #1 { %1 = alloca %S_56, align 4 %2 = bitcast %S_56* %1 to i8* call void @callee_sret_56(%S_56* nonnull sret %1) tail call void @callee_sret_32(%S_32* sret %agg.result) ret void ; CHECK-SCO-LABEL: caller_do_something_sret_32: ; CHECK-SCO: stdu 1 ; CHECK-SCO: bl callee_sret_56 ; CHECK-SCO: addi 1 ; CHECK-SCO: TC_RETURNd8 callee_sret_32 } define void @caller_local_sret_32(%S_32* %a) #1 { %tmp = alloca %S_32, align 4 tail call void @callee_sret_32(%S_32* nonnull sret %tmp) ret void ; CHECK-SCO-LABEL: caller_local_sret_32: ; CHECK-SCO: bl callee_sret_32 } attributes #0 = { noinline nounwind } attributes #1 = { nounwind } ; vector <4 x i1> test define void @callee_v4i1(i8 %a, <4 x i1> %b, <4 x i1> %c) { ret void } define void @caller_v4i1_reorder(i8 %a, <4 x i1> %b, <4 x i1> %c) { tail call void @callee_v4i1(i8 %a, <4 x i1> %c, <4 x i1> %b) ret void ; <4 x i1> is 32 bytes aligned, if subtarget doesn't support qpx, then we can't ; place b, c to qpx register, so we can't do sco on caller_v4i1_reorder ; CHECK-SCO-LABEL: caller_v4i1_reorder: ; CHECK-SCO: bl callee_v4i1 ; CHECK-SCO-HASQPX-LABEL: caller_v4i1_reorder: ; CHECK-SCO-HASQPX: b callee_v4i1 } define void @f128_callee(i32* %ptr, ppc_fp128 %a, ppc_fp128 %b) { ret void } define void @f128_caller(i32* %ptr, ppc_fp128 %a, ppc_fp128 %b) { tail call void @f128_callee(i32* %ptr, ppc_fp128 %a, ppc_fp128 %b) ret void ; CHECK-SCO-LABEL: f128_caller: ; CHECK-SCO: b f128_callee } ; weak linkage test %class.T = type { [2 x i8] } define weak_odr hidden void @wo_hcallee(%class.T* %this, i8* %c) { ret void } define void @wo_hcaller(%class.T* %this, i8* %c) { tail call void @wo_hcallee(%class.T* %this, i8* %c) ret void ; CHECK-SCO-LABEL: wo_hcaller: ; CHECK-SCO: b wo_hcallee ; SCM-LABEL: wo_hcaller: ; SCM: bl wo_hcallee } define weak_odr protected void @wo_pcallee(%class.T* %this, i8* %c) { ret void } define void @wo_pcaller(%class.T* %this, i8* %c) { tail call void @wo_pcallee(%class.T* %this, i8* %c) ret void ; CHECK-SCO-LABEL: wo_pcaller: ; CHECK-SCO: b wo_pcallee ; SCM-LABEL: wo_pcaller: ; SCM: bl wo_pcallee } define weak_odr void @wo_callee(%class.T* %this, i8* %c) { ret void } define void @wo_caller(%class.T* %this, i8* %c) { tail call void @wo_callee(%class.T* %this, i8* %c) ret void ; CHECK-SCO-LABEL: wo_caller: ; CHECK-SCO: b wo_callee ; SCM-LABEL: wo_caller: ; SCM: bl wo_callee } define weak protected void @w_pcallee(i8* %ptr) { ret void } define void @w_pcaller(i8* %ptr) { tail call void @w_pcallee(i8* %ptr) ret void ; CHECK-SCO-LABEL: w_pcaller: ; CHECK-SCO: b w_pcallee ; SCM-LABEL: w_pcaller: ; SCM: bl w_pcallee } define weak hidden void @w_hcallee(i8* %ptr) { ret void } define void @w_hcaller(i8* %ptr) { tail call void @w_hcallee(i8* %ptr) ret void ; CHECK-SCO-LABEL: w_hcaller: ; CHECK-SCO: b w_hcallee ; SCM-LABEL: w_hcaller: ; SCM: bl w_hcallee } define weak void @w_callee(i8* %ptr) { ret void } define void @w_caller(i8* %ptr) { tail call void @w_callee(i8* %ptr) ret void ; CHECK-SCO-LABEL: w_caller: ; CHECK-SCO: b w_callee ; SCM-LABEL: w_caller: ; SCM: bl w_callee } %struct.byvalTest = type { [8 x i8] } @byval = common global %struct.byvalTest zeroinitializer define void @byval_callee(%struct.byvalTest* byval %ptr) { ret void } define void @byval_caller() { tail call void @byval_callee(%struct.byvalTest* byval @byval) ret void ; CHECK-SCO-LABEL: bl byval_callee ; CHECK-SCO: bl byval_callee }