1
0
mirror of https://github.com/RPCS3/llvm-mirror.git synced 2024-10-22 04:22:57 +02:00
llvm-mirror/test/CodeGen/Hexagon/adjust-latency-stackST.ll
Krzysztof Parzyszek 230c3d0a1e [Hexagon] Adjust latency between allocframe and the first store on stack
Allocframe and the following stores on the stack have a latency of 2 cycles
when not in the same packet. This happens because R29 is needed early by the
store instruction. Since one of such stores can be packetized along with
allocframe and use old value of R29, we can assign it 0 cycle latency
while leaving latency of other stores to the default value of 2 cycles.

Patch by Jyotsna Verma.

llvm-svn: 302034
2017-05-03 15:33:09 +00:00

82 lines
3.3 KiB
LLVM

; RUN: llc -march=hexagon -disable-post-ra < %s | FileCheck %s
; Make sure that if there's only one store to the stack, it gets packetized
; with allocframe as there's a latency of 2 cycles between allocframe and
; the following store if not in the same packet.
; CHECK: {
; CHECK: memd(r29
; CHECK-NOT: {
; CHECK: allocframe
; CHECK: }
; CHECK: = memw(gp+#G)
; Aggregate types used by @test:
;   %struct.0 - a pointer to another %struct.0, an i32, and an embedded %struct.2
;   %struct.1 - two i32 fields followed by a 31-element i8 array
;   %struct.2 - wrapper holding a single %struct.1
%struct.0 = type { %struct.0*, i32, %struct.2 }
%struct.1 = type { i32, i32, [31 x i8] }
%struct.2 = type { %struct.1 }
; Common-linkage global pointer to a %struct.0, null-initialized, 4-byte aligned.
@G = common global %struct.0* null, align 4
; Test body. Takes a pointer %a0 to a %struct.0, keeps one pointer in a local
; stack slot (%v2), passes the address of that slot to @f0, and then branches
; on field 1 of the struct the slot points to after the call. The function
; always returns undef; only the generated code matters to this test.
define i32 @test(%struct.0* nocapture %a0) #0 {
b1:
; %v2 is the local stack slot; it holds a %struct.0*.
%v2 = alloca %struct.0*, align 4
%v3 = bitcast %struct.0** %v2 to i8*
; %v5 = pointer stored in field 0 of *%a0.
%v4 = getelementptr inbounds %struct.0, %struct.0* %a0, i32 0, i32 0
%v5 = load %struct.0*, %struct.0** %v4, align 4
; The only store in this function whose address is the alloca itself.
store %struct.0* %v5, %struct.0** %v2, align 4
%v6 = bitcast %struct.0* %v5 to i8*
; Load the pointer held in @G (viewed as i8*) and memcpy from it into *%v5
; with a length argument of 48.
%v7 = load i8*, i8** bitcast (%struct.0** @G to i8**), align 4
tail call void @llvm.memcpy.p0i8.p0i8.i32(i8* %v6, i8* %v7, i32 48, i32 4, i1 false)
; Write 5 into field 1 of the nested %struct.1 (index path 2, 0, 1) of both
; *%a0 and *%v5.
%v8 = getelementptr inbounds %struct.0, %struct.0* %a0, i32 0, i32 2, i32 0, i32 1
store i32 5, i32* %v8, align 4
%v9 = getelementptr inbounds %struct.0, %struct.0* %v5, i32 0, i32 2, i32 0, i32 1
store i32 5, i32* %v9, align 4
; Copy the first 32-bit word of *%a0 into the first 32-bit word of *%v5.
%v10 = bitcast %struct.0* %a0 to i32*
%v11 = load i32, i32* %v10, align 4
%v12 = bitcast %struct.0* %v5 to i32*
store i32 %v11, i32* %v12, align 4
; @f0 is declared variadic and called through a bitcast to a concrete
; prototype; it receives the address of the stack slot.
%v13 = call i32 bitcast (i32 (...)* @f0 to i32 (%struct.0**)*)(%struct.0** nonnull %v2)
; Reload the slot after the call (the callee was given its address), then
; test the i32 in field 1 of the pointed-to struct against zero.
%v14 = load %struct.0*, %struct.0** %v2, align 4
%v15 = getelementptr inbounds %struct.0, %struct.0* %v14, i32 0, i32 1
%v16 = load i32, i32* %v15, align 4
%v17 = icmp eq i32 %v16, 0
br i1 %v17, label %b18, label %b32
; Taken when field 1 of *%v14 is zero.
b18: ; preds = %b1
%v19 = bitcast %struct.0** %v2 to i32**
; Write 6 into nested field (2, 0, 1) of *%v14.
%v20 = getelementptr inbounds %struct.0, %struct.0* %v14, i32 0, i32 2, i32 0, i32 1
store i32 6, i32* %v20, align 4
; Call @f1 with the value of nested field (2, 0, 0) of *%a0 and the address
; of the same field in *%v14.
%v21 = getelementptr inbounds %struct.0, %struct.0* %a0, i32 0, i32 2, i32 0, i32 0
%v22 = load i32, i32* %v21, align 4
%v23 = getelementptr inbounds %struct.0, %struct.0* %v14, i32 0, i32 2, i32 0, i32 0
%v24 = call i32 bitcast (i32 (...)* @f1 to i32 (i32, i32*)*)(i32 %v22, i32* %v23)
; Read the first i32 of the object @G points to and store it through the
; pointer currently held in the stack slot (slot viewed as holding an i32*).
%v25 = load i32*, i32** bitcast (%struct.0** @G to i32**), align 4
%v26 = load i32, i32* %v25, align 4
%v27 = load i32*, i32** %v19, align 4
store i32 %v26, i32* %v27, align 4
; Reload the slot once more and pass nested field (2, 0, 1) to @f2 both by
; value and by address, with the constant 10 in between.
%v28 = load %struct.0*, %struct.0** %v2, align 4
%v29 = getelementptr inbounds %struct.0, %struct.0* %v28, i32 0, i32 2, i32 0, i32 1
%v30 = load i32, i32* %v29, align 4
%v31 = call i32 bitcast (i32 (...)* @f2 to i32 (i32, i32, i32*)*)(i32 %v30, i32 10, i32* %v29)
br label %b36
; Taken when field 1 of *%v14 is non-zero.
b32: ; preds = %b1
; Load the pointer stored in the first word of *%a0 (as i8*) and memcpy from
; it into *%a0 itself with a length argument of 48.
%v33 = bitcast %struct.0* %a0 to i8**
%v34 = load i8*, i8** %v33, align 4
%v35 = bitcast %struct.0* %a0 to i8*
call void @llvm.memcpy.p0i8.p0i8.i32(i8* %v35, i8* %v34, i32 48, i32 4, i1 false)
br label %b36
; Common exit; the result value is intentionally undef.
b36: ; preds = %b32, %b18
ret i32 undef
}
; memcpy intrinsic taking i8* destination, i8* source, an i32 length, and two
; trailing i32 / i1 operands.
declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture writeonly, i8* nocapture readonly, i32, i32, i1) #1
; External helpers, declared variadic and returning i32; @test calls each one
; through a bitcast to a concrete prototype.
declare i32 @f0(...) #0
declare i32 @f1(...) #0
declare i32 @f2(...) #0
; Attribute groups: #0 is used by @test and the helpers, #1 by the intrinsic.
attributes #0 = { nounwind }
attributes #1 = { argmemonly nounwind }