Merging r351753: (2bebfebe) · Commits · llvm-doe / llvm-project

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

+11 −5

Original line number	Diff line number	Diff line
		@@ -16214,18 +16214,24 @@ static SDValue reduceBuildVecToShuffleWithZero(SDNode *BV, SelectionDAG &DAG) {
		// The build vector contains some number of undef elements and exactly
		// one other element. That other element must be a zero-extended scalar
		// extracted from a vector at a constant index to turn this into a shuffle.
		// Also, require that the build vector does not implicitly truncate/extend
		// its elements.
		// TODO: This could be enhanced to allow ANY_EXTEND as well as ZERO_EXTEND.
		EVT VT = BV->getValueType(0);
		SDValue Zext = BV->getOperand(ZextElt);
		if (Zext.getOpcode() != ISD::ZERO_EXTEND \|\| !Zext.hasOneUse() \|\|
		Zext.getOperand(0).getOpcode() != ISD::EXTRACT_VECTOR_ELT \|\|
		!isa<ConstantSDNode>(Zext.getOperand(0).getOperand(1)))
		!isa<ConstantSDNode>(Zext.getOperand(0).getOperand(1)) \|\|
		Zext.getValueSizeInBits() != VT.getScalarSizeInBits())
		return SDValue();

		// The zero-extend must be a multiple of the source size.
		// The zero-extend must be a multiple of the source size, and we must be
		// building a vector of the same size as the source of the extract element.
		SDValue Extract = Zext.getOperand(0);
		unsigned DestSize = Zext.getValueSizeInBits();
		unsigned SrcSize = Extract.getValueSizeInBits();
		if (DestSize % SrcSize != 0)
		if (DestSize % SrcSize != 0 \|\|
		Extract.getOperand(0).getValueSizeInBits() != VT.getSizeInBits())
		return SDValue();

		// Create a shuffle mask that will combine the extracted element with zeros
		@@ -16260,7 +16266,7 @@ static SDValue reduceBuildVecToShuffleWithZero(SDNode *BV, SelectionDAG &DAG) {
		SDValue ZeroVec = DAG.getConstant(0, DL, VecVT);
		SDValue Shuf = DAG.getVectorShuffle(VecVT, DL, Extract.getOperand(0), ZeroVec,
		ShufMask);
		return DAG.getBitcast(BV->getValueType(0), Shuf);
		return DAG.getBitcast(VT, Shuf);
		}

		// Check to see if this is a BUILD_VECTOR of a bunch of EXTRACT_VECTOR_ELT

llvm/test/CodeGen/AArch64/build-vector-extract.ll

0 → 100644

+22 −0

Original line number	Diff line number	Diff line
		; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
		; RUN: llc < %s -mtriple=aarch64-- \| FileCheck %s

		; This would crash because we did not expect to create
		; a shuffle for a vector where the source operand is
		; not the same size as the result.
		; TODO: Should we handle this pattern? Ie, is moving to/from
		; registers the optimal code?

		define <4 x i32> @larger_bv_than_source(<4 x i16> %t0) {
		; CHECK-LABEL: larger_bv_than_source:
		; CHECK: // %bb.0:
		; CHECK-NEXT: // kill: def $d0 killed $d0 def $q0
		; CHECK-NEXT: umov w8, v0.h[2]
		; CHECK-NEXT: fmov s0, w8
		; CHECK-NEXT: ret
		%t1 = extractelement <4 x i16> %t0, i32 2
		%vgetq_lane = zext i16 %t1 to i32
		%t2 = insertelement <4 x i32> undef, i32 %vgetq_lane, i64 0
		ret <4 x i32> %t2
		}