mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-23 19:23:23 +01:00
Improve handling of immediates by splitting 32-bit immediates into two 16-bit
immediate operands when they will fit into the using instruction. llvm-svn: 84778
This commit is contained in:
parent
23ea13afbb
commit
452de96b04
@ -341,6 +341,66 @@ namespace ARM_AM {
|
||||
return -1;
|
||||
}
|
||||
|
||||
static inline unsigned getT2SOImmValRotate(unsigned V) {
|
||||
if ((V & ~255U) == 0) return 0;
|
||||
// Use CTZ to compute the rotate amount.
|
||||
unsigned RotAmt = CountTrailingZeros_32(V);
|
||||
return (32 - RotAmt) & 31;
|
||||
}
|
||||
|
||||
static inline bool isT2SOImmTwoPartVal (unsigned Imm) {
|
||||
unsigned V = Imm;
|
||||
// Passing values can be any combination of splat values and shifter
|
||||
// values. If this can be handled with a single shifter or splat, bail
|
||||
// out. Those should be handled directly, not with a two-part val.
|
||||
if (getT2SOImmValSplatVal(V) != -1)
|
||||
return false;
|
||||
V = rotr32 (~255U, getT2SOImmValRotate(V)) & V;
|
||||
if (V == 0)
|
||||
return false;
|
||||
|
||||
// If this can be handled as an immediate, accept.
|
||||
if (getT2SOImmVal(V) != -1) return true;
|
||||
|
||||
// Likewise, try masking out a splat value first.
|
||||
V = Imm;
|
||||
if (getT2SOImmValSplatVal(V & 0xff00ff00U) != -1)
|
||||
V &= ~0xff00ff00U;
|
||||
else if (getT2SOImmValSplatVal(V & 0x00ff00ffU) != -1)
|
||||
V &= ~0x00ff00ffU;
|
||||
// If what's left can be handled as an immediate, accept.
|
||||
if (getT2SOImmVal(V) != -1) return true;
|
||||
|
||||
// Otherwise, do not accept.
|
||||
return false;
|
||||
}
|
||||
|
||||
static inline unsigned getT2SOImmTwoPartFirst(unsigned Imm) {
|
||||
assert (isT2SOImmTwoPartVal(Imm) &&
|
||||
"Immedate cannot be encoded as two part immediate!");
|
||||
// Try a shifter operand as one part
|
||||
unsigned V = rotr32 (~255, getT2SOImmValRotate(Imm)) & Imm;
|
||||
// If the rest is encodable as an immediate, then return it.
|
||||
if (getT2SOImmVal(V) != -1) return V;
|
||||
|
||||
// Try masking out a splat value first.
|
||||
if (getT2SOImmValSplatVal(Imm & 0xff00ff00U) != -1)
|
||||
return Imm & 0xff00ff00U;
|
||||
|
||||
// The other splat is all that's left as an option.
|
||||
assert (getT2SOImmValSplatVal(Imm & 0x00ff00ffU) != -1);
|
||||
return Imm & 0x00ff00ffU;
|
||||
}
|
||||
|
||||
static inline unsigned getT2SOImmTwoPartSecond(unsigned Imm) {
|
||||
// Mask out the first hunk
|
||||
Imm ^= getT2SOImmTwoPartFirst(Imm);
|
||||
// Return what's left
|
||||
assert (getT2SOImmVal(Imm) != -1 &&
|
||||
"Unable to encode second part of T2 two part SO immediate");
|
||||
return Imm;
|
||||
}
|
||||
|
||||
|
||||
//===--------------------------------------------------------------------===//
|
||||
// Addressing Mode #2
|
||||
|
@ -1583,6 +1583,12 @@ def : ARMPat<(or GPR:$LHS, so_imm2part:$RHS),
|
||||
def : ARMPat<(xor GPR:$LHS, so_imm2part:$RHS),
|
||||
(EORri (EORri GPR:$LHS, (so_imm2part_1 imm:$RHS)),
|
||||
(so_imm2part_2 imm:$RHS))>;
|
||||
def : ARMPat<(add GPR:$LHS, so_imm2part:$RHS),
|
||||
(ADDri (ADDri GPR:$LHS, (so_imm2part_1 imm:$RHS)),
|
||||
(so_imm2part_2 imm:$RHS))>;
|
||||
def : ARMPat<(sub GPR:$LHS, so_imm2part:$RHS),
|
||||
(SUBri (SUBri GPR:$LHS, (so_imm2part_1 imm:$RHS)),
|
||||
(so_imm2part_2 imm:$RHS))>;
|
||||
|
||||
// 32-bit immediate using movw + movt.
|
||||
// This is a single pseudo instruction, the benefit is that it can be remat'd
|
||||
|
@ -69,6 +69,25 @@ def t2_so_imm_neg : Operand<i32>,
|
||||
return ARM_AM::getT2SOImmVal(-((int)N->getZExtValue())) != -1;
|
||||
}], t2_so_imm_neg_XFORM>;
|
||||
|
||||
// Break t2_so_imm's up into two pieces. This handles immediates with up to 16
|
||||
// bits set in them. This uses t2_so_imm2part to match and t2_so_imm2part_[12]
|
||||
// to get the first/second pieces.
|
||||
def t2_so_imm2part : Operand<i32>,
|
||||
PatLeaf<(imm), [{
|
||||
return ARM_AM::isT2SOImmTwoPartVal((unsigned)N->getZExtValue());
|
||||
}]> {
|
||||
}
|
||||
|
||||
def t2_so_imm2part_1 : SDNodeXForm<imm, [{
|
||||
unsigned V = ARM_AM::getT2SOImmTwoPartFirst((unsigned)N->getZExtValue());
|
||||
return CurDAG->getTargetConstant(V, MVT::i32);
|
||||
}]>;
|
||||
|
||||
def t2_so_imm2part_2 : SDNodeXForm<imm, [{
|
||||
unsigned V = ARM_AM::getT2SOImmTwoPartSecond((unsigned)N->getZExtValue());
|
||||
return CurDAG->getTargetConstant(V, MVT::i32);
|
||||
}]>;
|
||||
|
||||
/// imm1_31 predicate - True if the 32-bit immediate is in the range [1,31].
|
||||
def imm1_31 : PatLeaf<(i32 imm), [{
|
||||
return (int32_t)N->getZExtValue() >= 1 && (int32_t)N->getZExtValue() < 32;
|
||||
@ -1131,6 +1150,20 @@ def t2IT : Thumb2XI<(outs), (ins it_pred:$cc, it_mask:$mask),
|
||||
// Non-Instruction Patterns
|
||||
//
|
||||
|
||||
// Two piece so_imms.
|
||||
def : T2Pat<(or GPR:$LHS, t2_so_imm2part:$RHS),
|
||||
(t2ORRri (t2ORRri GPR:$LHS, (t2_so_imm2part_1 imm:$RHS)),
|
||||
(t2_so_imm2part_2 imm:$RHS))>;
|
||||
def : T2Pat<(xor GPR:$LHS, t2_so_imm2part:$RHS),
|
||||
(t2EORri (t2EORri GPR:$LHS, (t2_so_imm2part_1 imm:$RHS)),
|
||||
(t2_so_imm2part_2 imm:$RHS))>;
|
||||
def : T2Pat<(add GPR:$LHS, t2_so_imm2part:$RHS),
|
||||
(t2ADDri (t2ADDri GPR:$LHS, (t2_so_imm2part_1 imm:$RHS)),
|
||||
(t2_so_imm2part_2 imm:$RHS))>;
|
||||
def : T2Pat<(sub GPR:$LHS, t2_so_imm2part:$RHS),
|
||||
(t2SUBri (t2SUBri GPR:$LHS, (t2_so_imm2part_1 imm:$RHS)),
|
||||
(t2_so_imm2part_2 imm:$RHS))>;
|
||||
|
||||
// ConstantPool, GlobalAddress, and JumpTable
|
||||
def : T2Pat<(ARMWrapper tglobaladdr :$dst), (t2LEApcrel tglobaladdr :$dst)>;
|
||||
def : T2Pat<(ARMWrapper tconstpool :$dst), (t2LEApcrel tconstpool :$dst)>;
|
||||
|
@ -10,29 +10,32 @@ define i32 @t2_const_var2_1_ok_1(i32 %lhs) {
|
||||
ret i32 %ret
|
||||
}
|
||||
|
||||
define i32 @t2_const_var2_1_fail_1(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_1_fail_1:
|
||||
;CHECK: movt
|
||||
define i32 @t2_const_var2_1_ok_2(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_1_ok_2:
|
||||
;CHECK: #11206656
|
||||
;CHECK: #187
|
||||
%ret = add i32 %lhs, 11206843 ; 0x00ab00bb
|
||||
ret i32 %ret
|
||||
}
|
||||
|
||||
define i32 @t2_const_var2_1_fail_2(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_1_fail_2:
|
||||
;CHECK: movt
|
||||
define i32 @t2_const_var2_1_ok_3(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_1_ok_3:
|
||||
;CHECK: #11206827
|
||||
;CHECK: #16777216
|
||||
%ret = add i32 %lhs, 27984043 ; 0x01ab00ab
|
||||
ret i32 %ret
|
||||
}
|
||||
|
||||
define i32 @t2_const_var2_1_fail_3(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_1_fail_3:
|
||||
;CHECK: movt
|
||||
define i32 @t2_const_var2_1_ok_4(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_1_ok_4:
|
||||
;CHECK: #16777472
|
||||
;CHECK: #11206827
|
||||
%ret = add i32 %lhs, 27984299 ; 0x01ab01ab
|
||||
ret i32 %ret
|
||||
}
|
||||
|
||||
define i32 @t2_const_var2_1_fail_4(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_1_fail_4:
|
||||
define i32 @t2_const_var2_1_fail_1(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_1_fail_1:
|
||||
;CHECK: movt
|
||||
%ret = add i32 %lhs, 28027649 ; 0x01abab01
|
||||
ret i32 %ret
|
||||
@ -46,29 +49,31 @@ define i32 @t2_const_var2_2_ok_1(i32 %lhs) {
|
||||
ret i32 %ret
|
||||
}
|
||||
|
||||
define i32 @t2_const_var2_2_fail_1(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_2_fail_1:
|
||||
;CHECK: movt
|
||||
define i32 @t2_const_var2_2_ok_2(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_2_ok_2:
|
||||
;CHECK: #-1426063360
|
||||
;CHECK: #47616
|
||||
%ret = add i32 %lhs, 2868951552 ; 0xab00ba00
|
||||
ret i32 %ret
|
||||
}
|
||||
|
||||
define i32 @t2_const_var2_2_fail_2(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_2_fail_2:
|
||||
;CHECK: movt
|
||||
define i32 @t2_const_var2_2_ok_3(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_2_ok_3:
|
||||
;CHECK: #-1426019584
|
||||
%ret = add i32 %lhs, 2868947728 ; 0xab00ab10
|
||||
ret i32 %ret
|
||||
}
|
||||
|
||||
define i32 @t2_const_var2_2_fail_3(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_2_fail_3:
|
||||
;CHECK: movt
|
||||
define i32 @t2_const_var2_2_ok_4(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_2_ok_4:
|
||||
;CHECK: #-1426019584
|
||||
;CHECK: #1048592
|
||||
%ret = add i32 %lhs, 2869996304 ; 0xab10ab10
|
||||
ret i32 %ret
|
||||
}
|
||||
|
||||
define i32 @t2_const_var2_2_fail_4(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_2_fail_4:
|
||||
define i32 @t2_const_var2_2_fail_1(i32 %lhs) {
|
||||
;CHECK: t2_const_var2_2_fail_1:
|
||||
;CHECK: movt
|
||||
%ret = add i32 %lhs, 279685904 ; 0x10abab10
|
||||
ret i32 %ret
|
||||
@ -125,9 +130,10 @@ define i32 @t2_const_var3_2_ok_1(i32 %lhs) {
|
||||
ret i32 %ret
|
||||
}
|
||||
|
||||
define i32 @t2_const_var3_2_fail_1(i32 %lhs) {
|
||||
;CHECK: t2_const_var3_2_fail_1:
|
||||
;CHECK: movt
|
||||
define i32 @t2_const_var3_2_ok_2(i32 %lhs) {
|
||||
;CHECK: t2_const_var3_2_ok_2:
|
||||
;CHECK: #2097152
|
||||
;CHECK: #1843200
|
||||
%ret = add i32 %lhs, 3940352 ; 0b00000000001111000010000000000000
|
||||
ret i32 %ret
|
||||
}
|
||||
|
@ -55,10 +55,10 @@ define i32 @t2MOVTi16_test_3(i32 %a) {
|
||||
|
||||
define i32 @t2MOVTi16_test_nomatch_1(i32 %a) {
|
||||
; CHECK: t2MOVTi16_test_nomatch_1:
|
||||
; CHECK: movw r1, #16384
|
||||
; CHECK-NEXT: movt r1, #154
|
||||
; CHECK: #8388608
|
||||
; CHECK: movw r1, #65535
|
||||
; CHECK-NEXT: movt r1, #154
|
||||
; CHECK: #1720320
|
||||
%1 = shl i32 255, 8
|
||||
%2 = shl i32 1234, 8
|
||||
%3 = or i32 %1, 255 ; This give us 0xFFFF in %3
|
||||
|
Loading…
Reference in New Issue
Block a user