diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp index ecbd24febc6..73c4a1cabf5 100644 --- a/lib/Target/X86/X86ISelLowering.cpp +++ b/lib/Target/X86/X86ISelLowering.cpp @@ -17320,8 +17320,7 @@ static SDValue PerformAndCombine(SDNode *N, SelectionDAG &DAG, assert(N001.getValueType() == MVT::i8 && "unexpected type"); ConstantSDNode *C = dyn_cast(N00.getOperand(0)); if (C && C->getZExtValue() == 1) - return DAG.getNode(X86ISD::BZHI, DL, VT, N1, - DAG.getNode(ISD::ZERO_EXTEND, DL, VT, N001)); + return DAG.getNode(X86ISD::BZHI, DL, VT, N1, N001); } } @@ -17333,8 +17332,7 @@ static SDValue PerformAndCombine(SDNode *N, SelectionDAG &DAG, assert(N101.getValueType() == MVT::i8 && "unexpected type"); ConstantSDNode *C = dyn_cast(N10.getOperand(0)); if (C && C->getZExtValue() == 1) - return DAG.getNode(X86ISD::BZHI, DL, VT, N0, - DAG.getNode(ISD::ZERO_EXTEND, DL, VT, N101)); + return DAG.getNode(X86ISD::BZHI, DL, VT, N0, N101); } } } diff --git a/lib/Target/X86/X86InstrInfo.td b/lib/Target/X86/X86InstrInfo.td index fca7d4cea65..869b9e0dfe3 100644 --- a/lib/Target/X86/X86InstrInfo.td +++ b/lib/Target/X86/X86InstrInfo.td @@ -252,7 +252,7 @@ def X86and_flag : SDNode<"X86ISD::AND", SDTBinaryArithWithFlags, def X86blsi : SDNode<"X86ISD::BLSI", SDTIntUnaryOp>; def X86blsmsk : SDNode<"X86ISD::BLSMSK", SDTIntUnaryOp>; def X86blsr : SDNode<"X86ISD::BLSR", SDTIntUnaryOp>; -def X86bzhi : SDNode<"X86ISD::BZHI", SDTIntBinOp>; +def X86bzhi : SDNode<"X86ISD::BZHI", SDTIntShiftOp>; def X86mul_imm : SDNode<"X86ISD::MUL_IMM", SDTIntBinOp>; @@ -1856,14 +1856,18 @@ let Predicates = [HasBMI2], Defs = [EFLAGS] in { int_x86_bmi_bzhi_64, loadi64>, VEX_W; } -def : Pat<(X86bzhi GR32:$src1, GR32:$src2), - (BZHI32rr GR32:$src1, GR32:$src2)>; -def : Pat<(X86bzhi (loadi32 addr:$src1), GR32:$src2), - (BZHI32rm addr:$src1, GR32:$src2)>; -def : Pat<(X86bzhi GR64:$src1, GR64:$src2), - (BZHI64rr GR64:$src1, GR64:$src2)>; -def : Pat<(X86bzhi (loadi64 addr:$src1), GR64:$src2), - (BZHI64rm addr:$src1, GR64:$src2)>; +def : Pat<(X86bzhi GR32:$src1, GR8:$src2), + (BZHI32rr GR32:$src1, + (INSERT_SUBREG (i32 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>; +def : Pat<(X86bzhi (loadi32 addr:$src1), GR8:$src2), + (BZHI32rm addr:$src1, + (INSERT_SUBREG (i32 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>; +def : Pat<(X86bzhi GR64:$src1, GR8:$src2), + (BZHI64rr GR64:$src1, + (INSERT_SUBREG (i64 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>; +def : Pat<(X86bzhi (loadi64 addr:$src1), GR8:$src2), + (BZHI64rm addr:$src1, + (INSERT_SUBREG (i64 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>; multiclass bmi_pdep_pext