mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-24 11:42:57 +01:00
782b19da54
We can generate the actual instructions from the intrinsics without the need for pseudo-instructions. Also, since the intrinsics have a side- effect in a form of a store, attempt to optimize away loads from the store location. llvm-svn: 260690
104 lines
3.7 KiB
LLVM
104 lines
3.7 KiB
LLVM
; RUN: llc -march=hexagon < %s | FileCheck %s
|
|
; RUN: llc -march=hexagon -verify-machineinstrs=true < %s | FileCheck %s
|
|
; Test these 5 bitreverse store intrinsics:
|
|
; Q6_bitrev_store_update_D(inputLR, pDelay, nConvLength);
|
|
; Q6_bitrev_store_update_W(inputLR, pDelay, nConvLength);
|
|
; Q6_bitrev_store_update_HL(inputLR, pDelay, nConvLength);
|
|
; Q6_bitrev_store_update_HH(inputLR, pDelay, nConvLength);
|
|
; Q6_bitrev_store_update_B(inputLR, pDelay, nConvLength);
|
|
; producing these instructions:
|
|
; memd(r0++m0:brev) = r1:0
|
|
; memw(r0++m0:brev) = r0
|
|
; memh(r0++m0:brev) = r3
|
|
; memh(r0++m0:brev) = r3.h
|
|
; memb(r0++m0:brev) = r3
|
|
|
|
; ModuleID = 'brev_st.i'
|
|
target datalayout = "e-p:32:32:32-i64:64:64-i32:32:32-i16:16:16-i1:32:32-f64:64:64-f32:32:32-v64:64:64-v32:32:32-a0:0-n16:32"
|
|
target triple = "hexagon"
|
|
|
|
define i64 @foo(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind {
|
|
entry:
|
|
%conv = zext i16 %filtMemLen to i32
|
|
%shr2 = lshr i32 %conv, 1
|
|
%idxprom = sext i16 %filtMemIndex to i32
|
|
%arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom
|
|
%0 = bitcast i16* %arrayidx to i8*
|
|
%sub = sub i32 13, %shr2
|
|
%shl = shl i32 1, %sub
|
|
; CHECK: memd(r{{[0-9]*}} ++ m{{[0-1]}}:brev)
|
|
%1 = tail call i8* @llvm.hexagon.brev.std(i8* %0, i64 undef, i32 %shl)
|
|
ret i64 0
|
|
}
|
|
|
|
declare i8* @llvm.hexagon.brev.std(i8*, i64, i32) nounwind
|
|
|
|
define i32 @foo1(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind {
|
|
entry:
|
|
%conv = zext i16 %filtMemLen to i32
|
|
%shr1 = lshr i32 %conv, 1
|
|
%idxprom = sext i16 %filtMemIndex to i32
|
|
%arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom
|
|
%0 = bitcast i16* %arrayidx to i8*
|
|
%sub = sub i32 14, %shr1
|
|
%shl = shl i32 1, %sub
|
|
; CHECK: memw(r{{[0-9]*}} ++ m{{[0-1]}}:brev)
|
|
%1 = tail call i8* @llvm.hexagon.brev.stw(i8* %0, i32 undef, i32 %shl)
|
|
ret i32 0
|
|
}
|
|
|
|
declare i8* @llvm.hexagon.brev.stw(i8*, i32, i32) nounwind
|
|
|
|
define signext i16 @foo2(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind {
|
|
entry:
|
|
%conv = zext i16 %filtMemLen to i32
|
|
%shr2 = lshr i32 %conv, 1
|
|
%idxprom = sext i16 %filtMemIndex to i32
|
|
%arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom
|
|
%0 = bitcast i16* %arrayidx to i8*
|
|
%sub = sub i32 15, %shr2
|
|
%shl = shl i32 1, %sub
|
|
; CHECK: memh(r{{[0-9]*}} ++ m{{[0-1]}}:brev)
|
|
%1 = tail call i8* @llvm.hexagon.brev.sth(i8* %0, i32 0, i32 %shl)
|
|
ret i16 0
|
|
}
|
|
|
|
declare i8* @llvm.hexagon.brev.sth(i8*, i32, i32) nounwind
|
|
|
|
define signext i16 @foo3(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind {
|
|
entry:
|
|
%conv = zext i16 %filtMemLen to i32
|
|
%shr2 = lshr i32 %conv, 1
|
|
%idxprom = sext i16 %filtMemIndex to i32
|
|
%arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom
|
|
%0 = bitcast i16* %arrayidx to i8*
|
|
%sub = sub i32 15, %shr2
|
|
%shl = shl i32 1, %sub
|
|
; CHECK: memh(r{{[0-9]*}} ++ m{{[0-1]}}:brev){{ *}}={{ *}}r{{[0-9]*}}.h
|
|
%1 = tail call i8* @llvm.hexagon.brev.sthhi(i8* %0, i32 0, i32 %shl)
|
|
ret i16 0
|
|
}
|
|
|
|
declare i8* @llvm.hexagon.brev.sthhi(i8*, i32, i32) nounwind
|
|
|
|
define zeroext i8 @foo5(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind {
|
|
entry:
|
|
%conv = zext i16 %filtMemLen to i32
|
|
%shr2 = lshr i32 %conv, 1
|
|
%idxprom = sext i16 %filtMemIndex to i32
|
|
%arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom
|
|
%0 = bitcast i16* %arrayidx to i8*
|
|
%sub = sub nsw i32 16, %shr2
|
|
; CHECK: memb(r{{[0-9]*}} ++ m{{[0-1]}}:brev)
|
|
%shl = shl i32 1, %sub
|
|
%1 = tail call i8* @llvm.hexagon.brev.stb(i8* %0, i32 0, i32 %shl)
|
|
ret i8 0
|
|
}
|
|
|
|
declare i8* @llvm.hexagon.brev.stb(i8*, i32, i32) nounwind
|
|
|
|
!0 = !{!"omnipotent char", !1}
|
|
!1 = !{!"Simple C/C++ TBAA"}
|
|
!2 = !{!"int", !0}
|
|
!3 = !{!"short", !0}
|