1
0
mirror of https://github.com/RPCS3/llvm-mirror.git synced 2025-01-31 20:51:52 +01:00

[Hexagon] Bit-based instruction simplification

Analyze bit patterns of operands and values of instructions to perform
various simplifications, dead/redundant code elimination, etc.

llvm-svn: 250868
This commit is contained in:
Krzysztof Parzyszek 2015-10-20 22:57:13 +00:00
parent 52f05db67a
commit 4625bb8dfb
9 changed files with 2930 additions and 4 deletions

View File

@ -14,6 +14,7 @@ add_public_tablegen_target(HexagonCommonTableGen)
add_llvm_target(HexagonCodeGen
BitTracker.cpp
HexagonAsmPrinter.cpp
HexagonBitSimplify.cpp
HexagonBitTracker.cpp
HexagonCFGOptimizer.cpp
HexagonCommonGEP.cpp

File diff suppressed because it is too large Load Diff

View File

@ -62,6 +62,12 @@ static cl::opt<bool> EnableGenPred("hexagon-gen-pred", cl::init(true),
static cl::opt<bool> DisableHSDR("disable-hsdr", cl::init(false), cl::Hidden,
cl::desc("Disable splitting double registers"));
static cl::opt<bool> EnableBitSimplify("hexagon-bit", cl::init(true),
cl::Hidden, cl::desc("Bit simplification"));
static cl::opt<bool> EnableLoopResched("hexagon-loop-resched", cl::init(true),
cl::Hidden, cl::desc("Loop rescheduling"));
/// HexagonTargetMachineModule - Note that this is used on hosts that
/// cannot link in a library unless there are references into the
/// library. In particular, it seems that it is not possible to get
@ -84,6 +90,7 @@ SchedCustomRegistry("hexagon", "Run Hexagon's custom scheduler",
createVLIWMachineSched);
namespace llvm {
FunctionPass *createHexagonBitSimplify();
FunctionPass *createHexagonCallFrameInformation();
FunctionPass *createHexagonCFGOptimizer();
FunctionPass *createHexagonCommonGEP();
@ -99,6 +106,7 @@ namespace llvm {
FunctionPass *createHexagonHardwareLoops();
FunctionPass *createHexagonISelDag(HexagonTargetMachine &TM,
CodeGenOpt::Level OptLevel);
FunctionPass *createHexagonLoopRescheduling();
FunctionPass *createHexagonNewValueJump();
FunctionPass *createHexagonOptimizeSZextends();
FunctionPass *createHexagonPacketizer();
@ -223,9 +231,15 @@ bool HexagonPassConfig::addInstSelector() {
// Create logical operations on predicate registers.
if (EnableGenPred)
addPass(createHexagonGenPredicate(), false);
// Rotate loops to expose bit-simplification opportunities.
if (EnableLoopResched)
addPass(createHexagonLoopRescheduling(), false);
// Split double registers.
if (!DisableHSDR)
addPass(createHexagonSplitDoubleRegs());
// Bit simplification.
if (EnableBitSimplify)
addPass(createHexagonBitSimplify(), false);
addPass(createHexagonPeephole());
printAndVerify("After hexagon peephole pass");
if (EnableGenInsert)

View File

@ -1,4 +1,4 @@
; RUN: llc -march=hexagon -disable-hsdr -hexagon-expand-condsets=0 < %s | FileCheck %s
; RUN: llc -march=hexagon -disable-hsdr -hexagon-expand-condsets=0 -hexagon-bit=0 < %s | FileCheck %s
; CHECK: r{{[0-9]+:[0-9]+}} = #1
; CHECK: r{{[0-9]+:[0-9]+}} = #0

View File

@ -0,0 +1,53 @@
; RUN: llc < %s | FileCheck %s
target datalayout = "e-m:e-p:32:32-i1:32-i64:64-a:0-v32:32-n16:32"
target triple = "hexagon"
; CHECK-LABEL: test1:
; CHECK: r0 = ##1073741824
define i32 @test1() #0 {
entry:
%0 = tail call i32 @llvm.hexagon.S2.asr.i.r.rnd(i32 2147483647, i32 0)
ret i32 %0
}
; CHECK-LABEL: test2:
; CHECK: r0 = ##1073741824
define i32 @test2() #0 {
entry:
%0 = tail call i32 @llvm.hexagon.S2.asr.i.r.rnd.goodsyntax(i32 2147483647, i32 1)
ret i32 %0
}
; CHECK-LABEL: test3:
; CHECK: r1:0 = #1
define i64 @test3() #0 {
entry:
%0 = tail call i64 @llvm.hexagon.S4.extractp(i64 -1, i32 63, i32 63)
ret i64 %0
}
; CHECK-LABEL: test4:
; CHECK: r0 = #1
define i32 @test4() #0 {
entry:
%0 = tail call i32 @llvm.hexagon.S4.extract(i32 -1, i32 31, i32 31)
ret i32 %0
}
; CHECK-LABEL: test5:
; CHECK: r0 = ##-1073741569
define i32 @test5() #0 {
entry:
%0 = tail call i32 @llvm.hexagon.S4.subi.lsr.ri(i32 255, i32 -2147483648, i32 1)
ret i32 %0
}
declare i32 @llvm.hexagon.S2.asr.i.r.rnd(i32, i32) #0
declare i32 @llvm.hexagon.S2.asr.i.r.rnd.goodsyntax(i32, i32) #0
declare i64 @llvm.hexagon.S4.extractp(i64, i32, i32) #0
declare i32 @llvm.hexagon.S4.extract(i32, i32, i32) #0
declare i32 @llvm.hexagon.S4.subi.lsr.ri(i32, i32, i32) #0
attributes #0 = { nounwind readnone }

View File

@ -0,0 +1,80 @@
; RUN: llc < %s | FileCheck %s
; CHECK-DAG: memh(r{{[0-9]+}}+#0) = r{{[0-9]+}}
; CHECK-DAG: memh(r{{[0-9]+}}+#2) = r{{[0-9]+}}.h
; CHECK-DAG: memh(r{{[0-9]+}}+#4) = r{{[0-9]+}}
; CHECK-DAG: memh(r{{[0-9]+}}+#6) = r{{[0-9]+}}.h
target datalayout = "e-m:e-p:32:32-i1:32-i64:64-a:0-v32:32-n16:32"
target triple = "hexagon"
; Function Attrs: nounwind
define void @foo(i64* nocapture readonly %r64, i16 zeroext %n, i16 zeroext %s, i64* nocapture %p64) #0 {
entry:
%conv = zext i16 %n to i32
%cmp = icmp eq i16 %n, 0
br i1 %cmp, label %for.end, label %for.body.preheader
for.body.preheader: ; preds = %entry
%0 = load i64, i64* %r64, align 8, !tbaa !1
%v.sroa.0.0.extract.trunc = trunc i64 %0 to i16
%v.sroa.4.0.extract.shift = lshr i64 %0, 16
%v.sroa.4.0.extract.trunc = trunc i64 %v.sroa.4.0.extract.shift to i16
%v.sroa.5.0.extract.shift = lshr i64 %0, 32
%v.sroa.5.0.extract.trunc = trunc i64 %v.sroa.5.0.extract.shift to i16
%v.sroa.6.0.extract.shift = lshr i64 %0, 48
%v.sroa.6.0.extract.trunc = trunc i64 %v.sroa.6.0.extract.shift to i16
%1 = bitcast i64* %p64 to i16*
%conv2 = zext i16 %s to i32
%add.ptr = getelementptr inbounds i16, i16* %1, i32 %conv2
%add.ptr.sum = add nuw nsw i32 %conv2, 1
%add.ptr3 = getelementptr inbounds i16, i16* %1, i32 %add.ptr.sum
%add.ptr.sum50 = add nuw nsw i32 %conv2, 2
%add.ptr4 = getelementptr inbounds i16, i16* %1, i32 %add.ptr.sum50
%add.ptr.sum51 = add nuw nsw i32 %conv2, 3
%add.ptr5 = getelementptr inbounds i16, i16* %1, i32 %add.ptr.sum51
br label %for.body
for.body: ; preds = %for.body.preheader, %for.body
%add.ptr11.phi = phi i16* [ %add.ptr11.inc, %for.body ], [ %add.ptr, %for.body.preheader ]
%add.ptr16.phi = phi i16* [ %add.ptr16.inc, %for.body ], [ %add.ptr3, %for.body.preheader ]
%add.ptr21.phi = phi i16* [ %add.ptr21.inc, %for.body ], [ %add.ptr4, %for.body.preheader ]
%add.ptr26.phi = phi i16* [ %add.ptr26.inc, %for.body ], [ %add.ptr5, %for.body.preheader ]
%i.058.pmt = phi i32 [ %inc.pmt, %for.body ], [ 0, %for.body.preheader ]
%v.sroa.0.157 = phi i16 [ %v.sroa.0.0.extract.trunc34, %for.body ], [ %v.sroa.0.0.extract.trunc, %for.body.preheader ]
%v.sroa.4.156 = phi i16 [ %v.sroa.4.0.extract.trunc36, %for.body ], [ %v.sroa.4.0.extract.trunc, %for.body.preheader ]
%v.sroa.5.155 = phi i16 [ %v.sroa.5.0.extract.trunc38, %for.body ], [ %v.sroa.5.0.extract.trunc, %for.body.preheader ]
%v.sroa.6.154 = phi i16 [ %v.sroa.6.0.extract.trunc40, %for.body ], [ %v.sroa.6.0.extract.trunc, %for.body.preheader ]
%q64.153.pn = phi i64* [ %q64.153, %for.body ], [ %r64, %for.body.preheader ]
%q64.153 = getelementptr inbounds i64, i64* %q64.153.pn, i32 1
store i16 %v.sroa.0.157, i16* %add.ptr11.phi, align 2, !tbaa !5
store i16 %v.sroa.4.156, i16* %add.ptr16.phi, align 2, !tbaa !5
store i16 %v.sroa.5.155, i16* %add.ptr21.phi, align 2, !tbaa !5
store i16 %v.sroa.6.154, i16* %add.ptr26.phi, align 2, !tbaa !5
%2 = load i64, i64* %q64.153, align 8, !tbaa !1
%v.sroa.0.0.extract.trunc34 = trunc i64 %2 to i16
%v.sroa.4.0.extract.shift35 = lshr i64 %2, 16
%v.sroa.4.0.extract.trunc36 = trunc i64 %v.sroa.4.0.extract.shift35 to i16
%v.sroa.5.0.extract.shift37 = lshr i64 %2, 32
%v.sroa.5.0.extract.trunc38 = trunc i64 %v.sroa.5.0.extract.shift37 to i16
%v.sroa.6.0.extract.shift39 = lshr i64 %2, 48
%v.sroa.6.0.extract.trunc40 = trunc i64 %v.sroa.6.0.extract.shift39 to i16
%inc.pmt = add i32 %i.058.pmt, 1
%cmp8 = icmp slt i32 %inc.pmt, %conv
%add.ptr11.inc = getelementptr i16, i16* %add.ptr11.phi, i32 4
%add.ptr16.inc = getelementptr i16, i16* %add.ptr16.phi, i32 4
%add.ptr21.inc = getelementptr i16, i16* %add.ptr21.phi, i32 4
%add.ptr26.inc = getelementptr i16, i16* %add.ptr26.phi, i32 4
br i1 %cmp8, label %for.body, label %for.end
for.end: ; preds = %for.body, %entry
ret void
}
attributes #0 = { nounwind }
!1 = !{!2, !2, i64 0}
!2 = !{!"long long", !3, i64 0}
!3 = !{!"omnipotent char", !4, i64 0}
!4 = !{!"Simple C/C++ TBAA"}
!5 = !{!6, !6, i64 0}
!6 = !{!"short", !3, i64 0}

View File

@ -1,4 +1,4 @@
; RUN: llc -march=hexagon -mcpu=hexagonv5 < %s | FileCheck %s
; RUN: llc -march=hexagon -mcpu=hexagonv5 -hexagon-bit=0 < %s | FileCheck %s
; Optimized bitwise operations.
define i32 @my_clrbit(i32 %x) nounwind {

View File

@ -1,4 +1,4 @@
; RUN: llc -mtriple=hexagon-unknown-elf -mcpu=hexagonv5 < %s | FileCheck %s
; RUN: llc -mtriple=hexagon-unknown-elf -mcpu=hexagonv5 -hexagon-bit=0 < %s | FileCheck %s
; Optimize fabsf to clrbit in V5.
; CHECK: r{{[0-9]+}} = clrbit(r{{[0-9]+}}, #31)

View File

@ -1,4 +1,4 @@
; RUN: llc -march=hexagon -disable-hsdr -hexagon-expand-condsets=0 < %s | FileCheck %s
; RUN: llc -march=hexagon -disable-hsdr -hexagon-expand-condsets=0 -hexagon-bit=0 < %s | FileCheck %s
; CHECK: r{{[0-9]+:[0-9]+}} = #1
; CHECK: r{{[0-9]+:[0-9]+}} = #0