mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-10-19 11:02:59 +02:00
Fix *_EXTEND_VECTOR_INREG legalization
Summary: While promoting *_EXTEND_VECTOR_INREG nodes whose inputs are already promoted, perform the appropriate sign extension for the promoted node before doing the *_EXTEND_VECTOR_INREG operation. If not, the undefined high-order bits of the promoted operand may (a) be garbage inc ase of zext) or (b) contribute the wrong sign-bit (in case of sext) Updated the promote-vec3.ll test after this change. The diff shows explicit zeroing in case of zext and intermediate sign extension in case of sext. Reviewers: RKSimon Subscribers: llvm-commits, srhines Differential Revision: https://reviews.llvm.org/D25790 llvm-svn: 284752
This commit is contained in:
parent
aaf8c094e3
commit
4cd983fcee
@ -3349,11 +3349,27 @@ SDValue DAGTypeLegalizer::PromoteIntRes_EXTEND_VECTOR_INREG(SDNode *N) {
|
||||
|
||||
SDLoc dl(N);
|
||||
|
||||
// For operands whose TypeAction is to promote, the promoted node to construct
|
||||
// a new *_EXTEND_VECTOR_INREG node.
|
||||
// For operands whose TypeAction is to promote, extend the promoted node
|
||||
// appropriately (ZERO_EXTEND or SIGN_EXTEND) from the original pre-promotion
|
||||
// type, and then construct a new *_EXTEND_VECTOR_INREG node to the promote-to
|
||||
// type..
|
||||
if (getTypeAction(N->getOperand(0).getValueType())
|
||||
== TargetLowering::TypePromoteInteger) {
|
||||
SDValue Promoted = GetPromotedInteger(N->getOperand(0));
|
||||
SDValue Promoted;
|
||||
|
||||
switch(N->getOpcode()) {
|
||||
case ISD::SIGN_EXTEND_VECTOR_INREG:
|
||||
Promoted = SExtPromotedInteger(N->getOperand(0));
|
||||
break;
|
||||
case ISD::ZERO_EXTEND_VECTOR_INREG:
|
||||
Promoted = ZExtPromotedInteger(N->getOperand(0));
|
||||
break;
|
||||
case ISD::ANY_EXTEND_VECTOR_INREG:
|
||||
Promoted = GetPromotedInteger(N->getOperand(0));
|
||||
break;
|
||||
default:
|
||||
llvm_unreachable("Node has unexpected Opcode");
|
||||
}
|
||||
return DAG.getNode(N->getOpcode(), dl, NVT, Promoted);
|
||||
}
|
||||
|
||||
|
@ -9,16 +9,17 @@ define <3 x i16> @zext_i8(<3 x i8>) {
|
||||
; SSE3-LABEL: zext_i8:
|
||||
; SSE3: # BB#0:
|
||||
; SSE3-NEXT: movzbl {{[0-9]+}}(%esp), %eax
|
||||
; SSE3-NEXT: pinsrw $0, %eax, %xmm0
|
||||
; SSE3-NEXT: movzbl {{[0-9]+}}(%esp), %eax
|
||||
; SSE3-NEXT: pinsrw $1, %eax, %xmm0
|
||||
; SSE3-NEXT: movzbl {{[0-9]+}}(%esp), %eax
|
||||
; SSE3-NEXT: pinsrw $2, %eax, %xmm0
|
||||
; SSE3-NEXT: pxor %xmm0, %xmm0
|
||||
; SSE3-NEXT: pxor %xmm1, %xmm1
|
||||
; SSE3-NEXT: punpcklwd {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1],xmm0[2],xmm1[2],xmm0[3],xmm1[3]
|
||||
; SSE3-NEXT: movd %xmm0, %eax
|
||||
; SSE3-NEXT: pextrw $2, %xmm0, %edx
|
||||
; SSE3-NEXT: pextrw $4, %xmm0, %ecx
|
||||
; SSE3-NEXT: pinsrw $0, %eax, %xmm1
|
||||
; SSE3-NEXT: movzbl {{[0-9]+}}(%esp), %eax
|
||||
; SSE3-NEXT: pinsrw $1, %eax, %xmm1
|
||||
; SSE3-NEXT: movzbl {{[0-9]+}}(%esp), %eax
|
||||
; SSE3-NEXT: pinsrw $2, %eax, %xmm1
|
||||
; SSE3-NEXT: punpcklwd {{.*#+}} xmm1 = xmm1[0],xmm0[0],xmm1[1],xmm0[1],xmm1[2],xmm0[2],xmm1[3],xmm0[3]
|
||||
; SSE3-NEXT: movd %xmm1, %eax
|
||||
; SSE3-NEXT: pextrw $2, %xmm1, %edx
|
||||
; SSE3-NEXT: pextrw $4, %xmm1, %ecx
|
||||
; SSE3-NEXT: # kill: %AX<def> %AX<kill> %EAX<kill>
|
||||
; SSE3-NEXT: # kill: %DX<def> %DX<kill> %EDX<kill>
|
||||
; SSE3-NEXT: # kill: %CX<def> %CX<kill> %ECX<kill>
|
||||
@ -78,6 +79,8 @@ define <3 x i16> @sext_i8(<3 x i8>) {
|
||||
; SSE3-NEXT: pinsrw $1, %eax, %xmm0
|
||||
; SSE3-NEXT: movzbl {{[0-9]+}}(%esp), %eax
|
||||
; SSE3-NEXT: pinsrw $2, %eax, %xmm0
|
||||
; SSE3-NEXT: psllw $8, %xmm0
|
||||
; SSE3-NEXT: psraw $8, %xmm0
|
||||
; SSE3-NEXT: punpcklwd {{.*#+}} xmm0 = xmm0[0,0,1,1,2,2,3,3]
|
||||
; SSE3-NEXT: psrad $16, %xmm0
|
||||
; SSE3-NEXT: movd %xmm0, %eax
|
||||
|
Loading…
Reference in New Issue
Block a user