mirror of
https://github.com/intel/llvm.git
synced 2026-01-25 10:55:58 +08:00
[SelectionDAG] Add support for vector demandedelts in SRA opcodes
llvm-svn: 286461
This commit is contained in:
@@ -2265,7 +2265,8 @@ void SelectionDAG::computeKnownBits(SDValue Op, APInt &KnownZero,
|
||||
break;
|
||||
case ISD::SRA:
|
||||
if (const APInt *ShAmt = getValidShiftAmountConstant(Op)) {
|
||||
computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth + 1);
|
||||
computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, DemandedElts,
|
||||
Depth + 1);
|
||||
KnownZero = KnownZero.lshr(*ShAmt);
|
||||
KnownOne = KnownOne.lshr(*ShAmt);
|
||||
// If we know the value of the sign bit, then we know it is copied across
|
||||
|
||||
@@ -156,18 +156,12 @@ define <4 x i32> @knownbits_mask_shl_shuffle_lshr(<4 x i32> %a0) nounwind {
|
||||
define <4 x i32> @knownbits_mask_ashr_shuffle_lshr(<4 x i32> %a0) nounwind {
|
||||
; X32-LABEL: knownbits_mask_ashr_shuffle_lshr:
|
||||
; X32: # BB#0:
|
||||
; X32-NEXT: vpand {{\.LCPI.*}}, %xmm0, %xmm0
|
||||
; X32-NEXT: vpsrad $15, %xmm0, %xmm0
|
||||
; X32-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[0,0,3,3]
|
||||
; X32-NEXT: vpsrld $30, %xmm0, %xmm0
|
||||
; X32-NEXT: vxorps %xmm0, %xmm0, %xmm0
|
||||
; X32-NEXT: retl
|
||||
;
|
||||
; X64-LABEL: knownbits_mask_ashr_shuffle_lshr:
|
||||
; X64: # BB#0:
|
||||
; X64-NEXT: vpand {{.*}}(%rip), %xmm0, %xmm0
|
||||
; X64-NEXT: vpsrad $15, %xmm0, %xmm0
|
||||
; X64-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[0,0,3,3]
|
||||
; X64-NEXT: vpsrld $30, %xmm0, %xmm0
|
||||
; X64-NEXT: vxorps %xmm0, %xmm0, %xmm0
|
||||
; X64-NEXT: retq
|
||||
%1 = and <4 x i32> %a0, <i32 131071, i32 -1, i32 -1, i32 131071>
|
||||
%2 = ashr <4 x i32> %1, <i32 15, i32 15, i32 15, i32 15>
|
||||
|
||||
Reference in New Issue
Block a user