1
0
mirror of https://github.com/RPCS3/llvm-mirror.git synced 2024-11-22 18:54:02 +01:00
llvm-mirror/test/CodeGen/PowerPC/p10-constants.ll
Amy Kwan d439d93cd1 [PowerPC] Materialize 34-bit constants with pli directly
Previously, 34-bit constants were materialized in selectI64Imm(), and we relied
on td pattern matching to instead produce a pli. This becomes problematic as
there is no guarantee that the 34-bit constant will reach the td pattern
selection for pli. It is also possible for other transformations (such as complex
bit permutations) to produce and utilize the 34-bit constant materialized
through selectI64Imm().

This patch instead produces pli on Power10 directly whenever the constant fits
within 34 bits.

Differential Revision: https://reviews.llvm.org/D99906
2021-04-06 13:38:11 -05:00

393 lines
9.3 KiB
LLVM

; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \
; RUN: -mcpu=pwr10 -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | \
; RUN: FileCheck %s
; RUN: llc -verify-machineinstrs -mtriple=powerpc64-unknown-linux-gnu \
; RUN: -mcpu=pwr10 -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | \
; RUN: FileCheck %s
; RUN: llc -verify-machineinstrs -mtriple=powerpc-unknown-linux-gnu \
; RUN: -mcpu=pwr10 -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | \
; RUN: FileCheck %s --check-prefix=CHECK32
; These test cases aim to test constant materialization using the pli instruction on Power10.
; Returns the i32 constant 32768 (0x8000), the smallest positive value that no
; longer fits in a signed 16-bit immediate. All three llc configurations are
; expected to load it into r3 with a single pli followed directly by blr.
define signext i32 @t_16BitsMinRequiring34Bits() {
; CHECK-LABEL: t_16BitsMinRequiring34Bits:
; CHECK: pli r3, 32768
; CHECK-NEXT: blr
; CHECK32-LABEL: t_16BitsMinRequiring34Bits:
; CHECK32: pli r3, 32768
; CHECK32-NEXT: blr
entry:
ret i32 32768
}
; Returns the i32 constant 62004 (0xF234): it occupies 16 bits but is larger
; than 32767, so it is outside the signed 16-bit range. Both the 64-bit and the
; 32-bit configurations are expected to emit one pli and then blr.
define signext i32 @t_16Bits() {
; CHECK-LABEL: t_16Bits:
; CHECK: pli r3, 62004
; CHECK-NEXT: blr
; CHECK32-LABEL: t_16Bits:
; CHECK32: pli r3, 62004
; CHECK32-NEXT: blr
entry:
ret i32 62004
}
; Returns the i32 constant 1193046 (0x123456). Its low 16 bits (0x3456) are
; non-zero, so it is not a 16-bit value shifted left by 16; compare with
; t_lt32gt16BitsShiftable, which expects lis. Here every configuration is
; expected to emit one pli and then blr.
define signext i32 @t_lt32gt16BitsNonShiftable() {
; CHECK-LABEL: t_lt32gt16BitsNonShiftable:
; CHECK: pli r3, 1193046
; CHECK-NEXT: blr
; CHECK32-LABEL: t_lt32gt16BitsNonShiftable:
; CHECK32: pli r3, 1193046
; CHECK32-NEXT: blr
entry:
ret i32 1193046
}
; Returns the i32 constant -231451016, whose 32-bit pattern is 0xF2345678
; (all 32 bits significant, low half non-zero). Every configuration is expected
; to emit one pli with the signed value and then blr.
define signext i32 @t_32Bits() {
; CHECK-LABEL: t_32Bits:
; CHECK: pli r3, -231451016
; CHECK-NEXT: blr
; CHECK32-LABEL: t_32Bits:
; CHECK32: pli r3, -231451016
; CHECK32-NEXT: blr
entry:
ret i32 -231451016
}
; Returns the i64 constant 8589934591 (2^33 - 1 = 0x1FFFFFFFF), the largest
; positive value representable as a signed 34-bit immediate.
; 64-bit configurations: one pli into r3.
; 32-bit configuration: the value is split into two 32-bit words, li r3, 1
; (upper word) and li r4, -1 (lower word, 0xFFFFFFFF); no pli is expected.
define i64 @t_34BitsLargestPositive() {
; CHECK-LABEL: t_34BitsLargestPositive:
; CHECK: pli r3, 8589934591
; CHECK-NEXT: blr
; CHECK32-LABEL: t_34BitsLargestPositive:
; CHECK32: li r3, 1
; CHECK32-NEXT: li r4, -1
; CHECK32-NEXT: blr
entry:
ret i64 8589934591
}
; Returns the negative i64 constant -8284514696, which equals
; -2 * 2^32 + 305419896 (upper word -2, lower word 0x12345678) and lies within
; the signed 34-bit range.
; 64-bit configurations: one pli into r3.
; 32-bit configuration: li r3, -2 for the upper word and pli r4, 305419896 for
; the lower word.
define i64 @t_neg34Bits() {
; CHECK-LABEL: t_neg34Bits:
; CHECK: pli r3, -8284514696
; CHECK-NEXT: blr
; CHECK32-LABEL: t_neg34Bits:
; CHECK32: li r3, -2
; CHECK32-NEXT: pli r4, 305419896
; CHECK32-NEXT: blr
entry:
ret i64 -8284514696
}
; Returns the i32 constant 32767 (0x7FFF), the largest signed 16-bit value and
; exactly one less than the constant in t_16BitsMinRequiring34Bits. Every
; configuration is expected to use the plain li here rather than pli.
define signext i32 @t_16BitsMinRequiring34BitsMinusOne() {
; CHECK-LABEL: t_16BitsMinRequiring34BitsMinusOne:
; CHECK: li r3, 32767
; CHECK-NEXT: blr
; CHECK32-LABEL: t_16BitsMinRequiring34BitsMinusOne:
; CHECK32: li r3, 32767
; CHECK32-NEXT: blr
entry:
ret i32 32767
}
; Returns the small positive i32 constant 291 (0x123), well inside the signed
; 16-bit range. Every configuration is expected to emit li, not pli.
define signext i32 @t_lt16Bits() {
; CHECK-LABEL: t_lt16Bits:
; CHECK: li r3, 291
; CHECK-NEXT: blr
; CHECK32-LABEL: t_lt16Bits:
; CHECK32: li r3, 291
; CHECK32-NEXT: blr
entry:
ret i32 291
}
; Returns the small negative i32 constant -3805, inside the signed 16-bit
; range. Every configuration is expected to emit li, not pli.
define signext i32 @t_neglt16Bits() {
; CHECK-LABEL: t_neglt16Bits:
; CHECK: li r3, -3805
; CHECK-NEXT: blr
; CHECK32-LABEL: t_neglt16Bits:
; CHECK32: li r3, -3805
; CHECK32-NEXT: blr
entry:
ret i32 -3805
}
; Returns the negative i32 constant -32204, close to but still above the signed
; 16-bit minimum of -32768. Every configuration is expected to emit li.
define signext i32 @t_neg16Bits() {
; CHECK-LABEL: t_neg16Bits:
; CHECK: li r3, -32204
; CHECK-NEXT: blr
; CHECK32-LABEL: t_neg16Bits:
; CHECK32: li r3, -32204
; CHECK32-NEXT: blr
entry:
ret i32 -32204
}
; Returns the i32 constant 1179648 (0x120000 = 18 << 16): wider than 16 bits
; but with an all-zero low half. Every configuration is expected to emit
; lis r3, 18 rather than pli.
define signext i32 @t_lt32gt16BitsShiftable() {
; CHECK-LABEL: t_lt32gt16BitsShiftable:
; CHECK: lis r3, 18
; CHECK-NEXT: blr
; CHECK32-LABEL: t_lt32gt16BitsShiftable:
; CHECK32: lis r3, 18
; CHECK32-NEXT: blr
entry:
ret i32 1179648
}
; Returns the i32 constant -231473152 (bit pattern 0xF2340000 = -3532 << 16):
; a full 32-bit value whose low half is zero. Every configuration is expected
; to emit lis r3, -3532 rather than pli.
define signext i32 @t_32gt16BitsShiftable() {
; CHECK-LABEL: t_32gt16BitsShiftable:
; CHECK: lis r3, -3532
; CHECK-NEXT: blr
; CHECK32-LABEL: t_32gt16BitsShiftable:
; CHECK32: lis r3, -3532
; CHECK32-NEXT: blr
entry:
ret i32 -231473152
}
; Returns the i32 constant 0. Every configuration is expected to emit
; li r3, 0 followed directly by blr.
define signext i32 @t_32BitsZero() {
; CHECK-LABEL: t_32BitsZero:
; CHECK: li r3, 0
; CHECK-NEXT: blr
; CHECK32-LABEL: t_32BitsZero:
; CHECK32: li r3, 0
; CHECK32-NEXT: blr
entry:
ret i32 0
}
; Returns the i32 constant -1 (all 32 bits set). Every configuration is
; expected to emit li r3, -1 followed directly by blr.
define signext i32 @t_32BitsAllOnes() {
; CHECK-LABEL: t_32BitsAllOnes:
; CHECK: li r3, -1
; CHECK-NEXT: blr
; CHECK32-LABEL: t_32BitsAllOnes:
; CHECK32: li r3, -1
; CHECK32-NEXT: blr
entry:
ret i32 -1
}
; Returns the i64 constant 8589934592 (2^33 = 0x200000000), one more than the
; constant in t_34BitsLargestPositive and therefore outside the positive
; signed 34-bit range.
; 64-bit configurations: li r3, 1 followed by rldic to move the bit up by 33.
; 32-bit configuration: li r3, 2 (upper word) and li r4, 0 (lower word).
define i64 @t_34BitsLargestPositivePlus() {
; CHECK-LABEL: t_34BitsLargestPositivePlus:
; CHECK: li r3, 1
; CHECK-NEXT: rldic r3, r3, 33, 30
; CHECK-NEXT: blr
; CHECK32-LABEL: t_34BitsLargestPositivePlus:
; CHECK32: li r3, 2
; CHECK32-NEXT: li r4, 0
; CHECK32-NEXT: blr
entry:
ret i64 8589934592
}
; Returns the i64 constant 13190321784 (0x312345678 = 3 * 2^32 + 0x12345678).
; It needs 34 bits as an unsigned pattern, which is more than the largest
; positive signed 34-bit value (8589934591).
; 64-bit configurations: pli of 1648790223 followed by rldic with a shift of 3
; (1648790223 * 8 = 13190321784).
; 32-bit configuration: li r3, 3 (upper word) and pli r4, 305419896 (lower
; word, 0x12345678).
define i64 @t_34Bits() {
; CHECK-LABEL: t_34Bits:
; CHECK: pli r3, 1648790223
; CHECK-NEXT: rldic r3, r3, 3, 30
; CHECK-NEXT: blr
; CHECK32-LABEL: t_34Bits:
; CHECK32: li r3, 3
; CHECK32-NEXT: pli r4, 305419896
; CHECK32-NEXT: blr
entry:
ret i64 13190321784
}
; Returns the i64 constant 34128287352 (0x7F2345678 = 7 * 2^32 + 0xF2345678),
; a 35-bit pattern.
; 64-bit configurations: pli of 4266035919 followed by rldic with a shift of 3
; (4266035919 * 8 = 34128287352).
; 32-bit configuration: li r3, 7 (upper word) and pli r4, -231451016 (lower
; word, bit pattern 0xF2345678).
define i64 @t_35Bits() {
; CHECK-LABEL: t_35Bits:
; CHECK: pli r3, 4266035919
; CHECK-NEXT: rldic r3, r3, 3, 29
; CHECK-NEXT: blr
; CHECK32-LABEL: t_35Bits:
; CHECK32: li r3, 7
; CHECK32-NEXT: pli r4, -231451016
; CHECK32-NEXT: blr
entry:
ret i64 34128287352
}
; (Value >> Shift) can be expressed in 34 bits
; The expected pli immediate 8522759166 is 0x1FBFEFBFE; rotating that left by
; 48 bits yields the returned constant 0xFBFE00000001FBFE.
; Only the 64-bit configurations have expectations for this function.
define i64 @t_Shift() {
; CHECK-LABEL: t_Shift:
; CHECK: pli r3, 8522759166
; CHECK-NEXT: rotldi r3, r3, 48
; CHECK-NEXT: blr
entry:
; 0xFBFE00000001FBFE
ret i64 18157950747604548606
}
; Leading Zeros + Following Ones + Trailing Zeros > 30
; For 0x000FFFFFFFAABCF0 that is 12 leading zeros + 29 ones following them +
; 4 trailing zeros = 45. The expected pli immediate -349233 has the low bits
; 0xFFFAABCF; rldic then shifts it left by 4 with a mask starting at bit 12.
; Only the 64-bit configurations have expectations for this function.
define i64 @t_LZFOTZ() {
; CHECK-LABEL: t_LZFOTZ:
; CHECK: pli r3, -349233
; CHECK-NEXT: rldic r3, r3, 4, 12
; CHECK-NEXT: blr
entry:
; 0x000FFFFFFFAABCF0
ret i64 4503599621782768
}
; Leading Zeros + Trailing Ones > 30
; For 0x00001AFFF9AABFFF that is 19 leading zeros + 14 trailing ones = 33.
; The expected sequence is a negative pli immediate followed by rldicl, which
; rotates left by 11 and clears the upper 19 bits.
; Only the 64-bit configurations have expectations for this function.
define i64 @t_LZTO() {
; CHECK-LABEL: t_LZTO:
; CHECK: pli r3, -2684406441
; CHECK-NEXT: rldicl r3, r3, 11, 19
; CHECK-NEXT: blr
entry:
; 0x00001AFFF9AABFFF
ret i64 29686707699711
}
; Leading Zeros + Trailing Ones + Following Ones > 30
; For 0x000FF55879AA87FF that is 12 leading zeros + 11 trailing ones + 8 ones
; following the leading zeros = 31. Leading zeros plus trailing ones alone give
; only 23, so the following ones are what push this constant over 30.
; The expected sequence is a negative pli immediate followed by rldicl, which
; rotates left by 11 and clears the upper 12 bits.
; Only the 64-bit configurations have expectations for this function.
define i64 @t_LZTOFO() {
; CHECK-LABEL: t_LZTOFO:
; CHECK: pli r3, -5720033968
; CHECK-NEXT: rldicl r3, r3, 11, 12
; CHECK-NEXT: blr
entry:
; 0x000FF55879AA87FF
ret i64 4491884997806079
}
; Requires full expansion
; The constant 0x7FF0FFFFF0FFF0FE is expected to be built from two 32-bit
; halves: pli r4 with the upper word 0x7FF0FFFF (2146500607), pli r3 with the
; lower word 0xF0FFF0FE (4043305214), then rldimi to insert r4 into the upper
; 32 bits of r3.
; Only the 64-bit configurations have expectations for this function.
define i64 @t_Full64Bits1() {
; CHECK-LABEL: t_Full64Bits1:
; CHECK: pli r4, 2146500607
; CHECK-NEXT: pli r3, 4043305214
; CHECK-NEXT: rldimi r3, r4, 32, 0
; CHECK-NEXT: blr
entry:
; 0x7FF0FFFFF0FFF0FE
ret i64 9219149911952453886
}
; Requires full expansion
; Same shape as t_Full64Bits1 but with the top bit of the constant set:
; 0xF0F0FFFFF0FFF0FE is expected to be built from pli r4 with the upper word
; 0xF0F0FFFF (4042326015), pli r3 with the lower word 0xF0FFF0FE (4043305214),
; and rldimi to insert r4 into the upper 32 bits of r3.
; Only the 64-bit configurations have expectations for this function.
; NOTE(review): the name looks like a typo of "t_Full64Bits2" (compare
; t_Full64Bits1); left unchanged because renaming alters the emitted symbol.
define i64 @t_Ful64Bits2() {
; CHECK-LABEL: t_Ful64Bits2:
; CHECK: pli r4, 4042326015
; CHECK-NEXT: pli r3, 4043305214
; CHECK-NEXT: rldimi r3, r4, 32, 0
; CHECK-NEXT: blr
entry:
; 0xF0F0FFFFF0FFF0FE
ret i64 17361658038238310654
}
; A splat of 32 bits: 32 Bits Low == 32 Bits High
; Both halves of 0x0FABCABC0FABCABC are 0x0FABCABC (262916796), so only one pli
; is expected; rldimi then inserts r3 into its own upper 32 bits.
; Only the 64-bit configurations have expectations for this function.
define i64 @t_Splat32Bits() {
; CHECK-LABEL: t_Splat32Bits:
; CHECK: pli r3, 262916796
; CHECK-NEXT: rldimi r3, r3, 32, 0
; CHECK-NEXT: blr
entry:
; 0x0FABCABC0FABCABC
ret i64 1129219040652020412
}
; Producing `pli` when the constant fits within 34-bits and the constant
; is being produced in other transformations (such as complex bit permutations).
;
; Computes (%b & -8858370049) | (%a & 8589934592). The first mask is all ones
; except bits 28 and 33 (2^28 + 2^33 = 8858370048); the second keeps only
; bit 33 of %a.
; 64-bit configurations: a rotate/insert pair, then the constant -268435457
; (all ones except bit 28) loaded with pli and applied with and.
; 32-bit configuration: only rlwinm and rlwimi are expected; no immediate load
; appears in the expected sequence.
define i64 @t_34Bits_Complex(i64 %a, i64 %b) {
; CHECK-LABEL: t_34Bits_Complex:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: rotldi r4, r4, 30
; CHECK-NEXT: rldimi r3, r4, 34, 31
; CHECK-NEXT: pli r4, -268435457
; CHECK-NEXT: and r3, r3, r4
; CHECK-NEXT: blr
;
; CHECK32-LABEL: t_34Bits_Complex:
; CHECK32: # %bb.0: # %entry
; CHECK32-NEXT: rlwinm r4, r6, 0, 4, 2
; CHECK32-NEXT: rlwimi r3, r5, 0, 31, 29
; CHECK32-NEXT: blr
entry:
; Keep only bit 33 of %a.
%and = and i64 %a, 8589934592
; Clear bits 28 and 33 of %b.
%and1 = and i64 %b, -8858370049
; Merge: bit 33 comes from %a, everything else (minus bit 28) from %b.
%or = or i64 %and1, %and
ret i64 %or
}
; The load immediates resulting from phi-nodes are needed to test whether
; li/lis is preferred to pli by the instruction selector.
;
; The phis in %while.body.i receive -1, 0, 291 and 1179648 from %while.body;
; these are the values the first expectation group loads with li/lis (1179648
; is 18 << 16). The phis in %sw.epilog.i receive -231451016, 32768, 1193046 and
; 2147483647 from %sw.bb1.i; these are the values the second group loads with
; pli. The same sequences are expected for the 64-bit and 32-bit configurations.
; The function never returns: every path either loops or ends in unreachable.
define dso_local void @t_phiNode() {
; CHECK-LABEL: t_phiNode:
; CHECK: lis r6, 18
; CHECK-NEXT: li r5, 291
; CHECK-NEXT: li r4, 0
; CHECK-NEXT: cmpwi r3, 1
; CHECK-NEXT: li r3, -1
; CHECK: pli r6, 2147483647
; CHECK-NEXT: pli r5, 1193046
; CHECK-NEXT: pli r4, 32768
; CHECK-NEXT: pli r3, -231451016
; CHECK32-LABEL: t_phiNode:
; CHECK32: lis r6, 18
; CHECK32-NEXT: li r5, 291
; CHECK32-NEXT: li r4, 0
; CHECK32-NEXT: cmpwi r3, 1
; CHECK32-NEXT: li r3, -1
; CHECK32: pli r6, 2147483647
; CHECK32-NEXT: pli r5, 1193046
; CHECK32-NEXT: pli r4, 32768
; CHECK32-NEXT: pli r3, -231451016
entry:
br label %while.body
while.body: ; preds = %if.else.i, %entry
br label %while.body.i
while.body.i: ; preds = %sw.epilog.i, %while.body
; Loop-carried values; the constants on the %while.body edge are the ones
; expected to be materialized with li/lis.
%a.1.i = phi i32 [ %a.2.i, %sw.epilog.i ], [ -1, %while.body ]
%b.1.i = phi i32 [ %b.2.i, %sw.epilog.i ], [ 0, %while.body ]
%c.1.i = phi i32 [ %c.2.i, %sw.epilog.i ], [ 291, %while.body ]
%d.1.i = phi i32 [ %d.2.i, %sw.epilog.i ], [ 1179648, %while.body ]
; NOTE(review): the load from null and the switch on undef below look like
; leftovers of test-case reduction that exist only to create control flow;
; confirm before modifying them.
%0 = load i8, i8* null, align 1
%cmp1.i = icmp eq i8 %0, 1
br i1 %cmp1.i, label %if.then.i, label %if.else.i
if.then.i: ; preds = %while.body.i
switch i8 undef, label %sw.default.i [
i8 3, label %sw.epilog.i
i8 2, label %sw.bb1.i
]
sw.bb1.i: ; preds = %if.then.i
br label %sw.epilog.i
sw.default.i: ; preds = %if.then.i
unreachable
sw.epilog.i: ; preds = %sw.bb1.i, %if.then.i
; The constants on the %sw.bb1.i edge are the ones expected to be materialized
; with pli; the %if.then.i edge just forwards the current loop values.
%a.2.i = phi i32 [ -231451016, %sw.bb1.i ], [ %a.1.i, %if.then.i ]
%b.2.i = phi i32 [ 32768, %sw.bb1.i ], [ %b.1.i, %if.then.i ]
%c.2.i = phi i32 [ 1193046, %sw.bb1.i ], [ %c.1.i, %if.then.i ]
%d.2.i = phi i32 [ 2147483647, %sw.bb1.i ], [ %d.1.i, %if.then.i ]
br label %while.body.i
if.else.i: ; preds = %while.body.i
; Passing all four loop values to an external call keeps them live.
call void @func2(i32 signext %a.1.i, i32 signext %b.1.i, i32 signext %c.1.i, i32 signext %d.1.i)
br label %while.body
}
; External function taking four i32 arguments; it is only declared in this
; file and is called from t_phiNode with the four loop-carried values.
; NOTE(review): the call site marks each argument signext while this
; declaration carries no parameter attributes - confirm that is intentional.
declare void @func2(i32, i32, i32, i32)