-
Notifications
You must be signed in to change notification settings - Fork 14.5k
[VPlan] Add VPExpressionRecipe, replacing extended reduction recipes. #144281
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from 3 commits
736357e
3c3f9e4
1b7bf4b
e8dc289
9688a79
741ba42
ac1a2dc
3be870c
d87843c
86b1216
285ac34
1d717d2
201c5d7
1bae34e
42359e5
6b85231
3908cd6
c70bba4
4bfef50
4ed3f43
a661de8
8af8f33
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change | ||||||
---|---|---|---|---|---|---|---|---|
|
@@ -525,14 +525,13 @@ class VPSingleDefRecipe : public VPRecipeBase, public VPValue { | |||||||
|
||||||||
static inline bool classof(const VPRecipeBase *R) { | ||||||||
switch (R->getVPDefID()) { | ||||||||
case VPRecipeBase::VPBundleSC: | ||||||||
case VPRecipeBase::VPDerivedIVSC: | ||||||||
case VPRecipeBase::VPEVLBasedIVPHISC: | ||||||||
case VPRecipeBase::VPExpandSCEVSC: | ||||||||
case VPRecipeBase::VPInstructionSC: | ||||||||
case VPRecipeBase::VPReductionEVLSC: | ||||||||
case VPRecipeBase::VPReductionSC: | ||||||||
case VPRecipeBase::VPMulAccumulateReductionSC: | ||||||||
case VPRecipeBase::VPExtendedReductionSC: | ||||||||
case VPRecipeBase::VPReplicateSC: | ||||||||
case VPRecipeBase::VPScalarIVStepsSC: | ||||||||
case VPRecipeBase::VPVectorPointerSC: | ||||||||
|
@@ -852,9 +851,7 @@ struct VPRecipeWithIRFlags : public VPSingleDefRecipe, public VPIRFlags { | |||||||
R->getVPDefID() == VPRecipeBase::VPReductionEVLSC || | ||||||||
R->getVPDefID() == VPRecipeBase::VPReplicateSC || | ||||||||
R->getVPDefID() == VPRecipeBase::VPVectorEndPointerSC || | ||||||||
R->getVPDefID() == VPRecipeBase::VPVectorPointerSC || | ||||||||
R->getVPDefID() == VPRecipeBase::VPExtendedReductionSC || | ||||||||
R->getVPDefID() == VPRecipeBase::VPMulAccumulateReductionSC; | ||||||||
R->getVPDefID() == VPRecipeBase::VPVectorPointerSC; | ||||||||
} | ||||||||
|
||||||||
static inline bool classof(const VPUser *U) { | ||||||||
|
@@ -2432,28 +2429,6 @@ class VPReductionRecipe : public VPRecipeWithIRFlags { | |||||||
setUnderlyingValue(I); | ||||||||
} | ||||||||
|
||||||||
/// For VPExtendedReductionRecipe. | ||||||||
/// Note that the debug location is from the extend. | ||||||||
VPReductionRecipe(const unsigned char SC, const RecurKind RdxKind, | ||||||||
ArrayRef<VPValue *> Operands, VPValue *CondOp, | ||||||||
bool IsOrdered, DebugLoc DL) | ||||||||
: VPRecipeWithIRFlags(SC, Operands, DL), RdxKind(RdxKind), | ||||||||
IsOrdered(IsOrdered), IsConditional(CondOp) { | ||||||||
if (CondOp) | ||||||||
addOperand(CondOp); | ||||||||
} | ||||||||
|
||||||||
/// For VPMulAccumulateReductionRecipe. | ||||||||
/// Note that the NUW/NSW flags and the debug location are from the Mul. | ||||||||
VPReductionRecipe(const unsigned char SC, const RecurKind RdxKind, | ||||||||
ArrayRef<VPValue *> Operands, VPValue *CondOp, | ||||||||
bool IsOrdered, WrapFlagsTy WrapFlags, DebugLoc DL) | ||||||||
: VPRecipeWithIRFlags(SC, Operands, WrapFlags, DL), RdxKind(RdxKind), | ||||||||
IsOrdered(IsOrdered), IsConditional(CondOp) { | ||||||||
if (CondOp) | ||||||||
addOperand(CondOp); | ||||||||
} | ||||||||
|
||||||||
public: | ||||||||
VPReductionRecipe(RecurKind RdxKind, FastMathFlags FMFs, Instruction *I, | ||||||||
VPValue *ChainOp, VPValue *VecOp, VPValue *CondOp, | ||||||||
|
@@ -2479,9 +2454,7 @@ class VPReductionRecipe : public VPRecipeWithIRFlags { | |||||||
|
||||||||
static inline bool classof(const VPRecipeBase *R) { | ||||||||
return R->getVPDefID() == VPRecipeBase::VPReductionSC || | ||||||||
R->getVPDefID() == VPRecipeBase::VPReductionEVLSC || | ||||||||
R->getVPDefID() == VPRecipeBase::VPExtendedReductionSC || | ||||||||
R->getVPDefID() == VPRecipeBase::VPMulAccumulateReductionSC; | ||||||||
R->getVPDefID() == VPRecipeBase::VPReductionEVLSC; | ||||||||
} | ||||||||
|
||||||||
static inline bool classof(const VPUser *U) { | ||||||||
|
@@ -2620,190 +2593,6 @@ class VPReductionEVLRecipe : public VPReductionRecipe { | |||||||
} | ||||||||
}; | ||||||||
|
||||||||
/// A recipe to represent inloop extended reduction operations, performing a | ||||||||
/// reduction on a extended vector operand into a scalar value, and adding the | ||||||||
/// result to a chain. This recipe is abstract and needs to be lowered to | ||||||||
/// concrete recipes before codegen. The operands are {ChainOp, VecOp, | ||||||||
/// [Condition]}. | ||||||||
class VPExtendedReductionRecipe : public VPReductionRecipe { | ||||||||
/// Opcode of the extend for VecOp. | ||||||||
Instruction::CastOps ExtOp; | ||||||||
|
||||||||
/// The scalar type after extending. | ||||||||
Type *ResultTy; | ||||||||
|
||||||||
/// For cloning VPExtendedReductionRecipe. | ||||||||
VPExtendedReductionRecipe(VPExtendedReductionRecipe *ExtRed) | ||||||||
: VPReductionRecipe( | ||||||||
VPDef::VPExtendedReductionSC, ExtRed->getRecurrenceKind(), | ||||||||
{ExtRed->getChainOp(), ExtRed->getVecOp()}, ExtRed->getCondOp(), | ||||||||
ExtRed->isOrdered(), ExtRed->getDebugLoc()), | ||||||||
ExtOp(ExtRed->getExtOpcode()), ResultTy(ExtRed->getResultType()) { | ||||||||
transferFlags(*ExtRed); | ||||||||
setUnderlyingValue(ExtRed->getUnderlyingValue()); | ||||||||
} | ||||||||
|
||||||||
public: | ||||||||
VPExtendedReductionRecipe(VPReductionRecipe *R, VPWidenCastRecipe *Ext) | ||||||||
: VPReductionRecipe(VPDef::VPExtendedReductionSC, R->getRecurrenceKind(), | ||||||||
{R->getChainOp(), Ext->getOperand(0)}, R->getCondOp(), | ||||||||
R->isOrdered(), Ext->getDebugLoc()), | ||||||||
ExtOp(Ext->getOpcode()), ResultTy(Ext->getResultType()) { | ||||||||
assert((ExtOp == Instruction::CastOps::ZExt || | ||||||||
ExtOp == Instruction::CastOps::SExt) && | ||||||||
"VPExtendedReductionRecipe only supports zext and sext."); | ||||||||
|
||||||||
transferFlags(*Ext); | ||||||||
setUnderlyingValue(R->getUnderlyingValue()); | ||||||||
} | ||||||||
|
||||||||
~VPExtendedReductionRecipe() override = default; | ||||||||
|
||||||||
VPExtendedReductionRecipe *clone() override { | ||||||||
return new VPExtendedReductionRecipe(this); | ||||||||
} | ||||||||
|
||||||||
VP_CLASSOF_IMPL(VPDef::VPExtendedReductionSC); | ||||||||
|
||||||||
void execute(VPTransformState &State) override { | ||||||||
llvm_unreachable("VPExtendedReductionRecipe should be transform to " | ||||||||
"VPExtendedRecipe + VPReductionRecipe before execution."); | ||||||||
}; | ||||||||
|
||||||||
/// Return the cost of VPExtendedReductionRecipe. | ||||||||
InstructionCost computeCost(ElementCount VF, | ||||||||
VPCostContext &Ctx) const override; | ||||||||
|
||||||||
#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP) | ||||||||
/// Print the recipe. | ||||||||
void print(raw_ostream &O, const Twine &Indent, | ||||||||
VPSlotTracker &SlotTracker) const override; | ||||||||
#endif | ||||||||
|
||||||||
/// The scalar type after extending. | ||||||||
Type *getResultType() const { return ResultTy; } | ||||||||
|
||||||||
/// Is the extend ZExt? | ||||||||
bool isZExt() const { return getExtOpcode() == Instruction::ZExt; } | ||||||||
|
||||||||
/// Get the opcode of the extend for VecOp. | ||||||||
Instruction::CastOps getExtOpcode() const { return ExtOp; } | ||||||||
}; | ||||||||
|
||||||||
/// A recipe to represent inloop MulAccumulateReduction operations, multiplying | ||||||||
/// the vector operands (which may be extended), performing a reduction.add on | ||||||||
/// the result, and adding the scalar result to a chain. This recipe is abstract | ||||||||
/// and needs to be lowered to concrete recipes before codegen. The operands are | ||||||||
/// {ChainOp, VecOp1, VecOp2, [Condition]}. | ||||||||
class VPMulAccumulateReductionRecipe : public VPReductionRecipe { | ||||||||
/// Opcode of the extend for VecOp1 and VecOp2. | ||||||||
Instruction::CastOps ExtOp; | ||||||||
|
||||||||
/// Non-neg flag of the extend recipe. | ||||||||
bool IsNonNeg = false; | ||||||||
|
||||||||
/// The scalar type after extending. | ||||||||
Type *ResultTy = nullptr; | ||||||||
|
||||||||
/// For cloning VPMulAccumulateReductionRecipe. | ||||||||
VPMulAccumulateReductionRecipe(VPMulAccumulateReductionRecipe *MulAcc) | ||||||||
: VPReductionRecipe( | ||||||||
VPDef::VPMulAccumulateReductionSC, MulAcc->getRecurrenceKind(), | ||||||||
{MulAcc->getChainOp(), MulAcc->getVecOp0(), MulAcc->getVecOp1()}, | ||||||||
MulAcc->getCondOp(), MulAcc->isOrdered(), | ||||||||
WrapFlagsTy(MulAcc->hasNoUnsignedWrap(), MulAcc->hasNoSignedWrap()), | ||||||||
MulAcc->getDebugLoc()), | ||||||||
ExtOp(MulAcc->getExtOpcode()), IsNonNeg(MulAcc->isNonNeg()), | ||||||||
ResultTy(MulAcc->getResultType()) { | ||||||||
transferFlags(*MulAcc); | ||||||||
setUnderlyingValue(MulAcc->getUnderlyingValue()); | ||||||||
} | ||||||||
|
||||||||
public: | ||||||||
VPMulAccumulateReductionRecipe(VPReductionRecipe *R, VPWidenRecipe *Mul, | ||||||||
VPWidenCastRecipe *Ext0, | ||||||||
VPWidenCastRecipe *Ext1, Type *ResultTy) | ||||||||
: VPReductionRecipe( | ||||||||
VPDef::VPMulAccumulateReductionSC, R->getRecurrenceKind(), | ||||||||
{R->getChainOp(), Ext0->getOperand(0), Ext1->getOperand(0)}, | ||||||||
R->getCondOp(), R->isOrdered(), | ||||||||
WrapFlagsTy(Mul->hasNoUnsignedWrap(), Mul->hasNoSignedWrap()), | ||||||||
R->getDebugLoc()), | ||||||||
ExtOp(Ext0->getOpcode()), ResultTy(ResultTy) { | ||||||||
assert(RecurrenceDescriptor::getOpcode(getRecurrenceKind()) == | ||||||||
Instruction::Add && | ||||||||
"The reduction instruction in MulAccumulateteReductionRecipe must " | ||||||||
"be Add"); | ||||||||
assert((ExtOp == Instruction::CastOps::ZExt || | ||||||||
ExtOp == Instruction::CastOps::SExt) && | ||||||||
"VPMulAccumulateReductionRecipe only supports zext and sext."); | ||||||||
setUnderlyingValue(R->getUnderlyingValue()); | ||||||||
// Only set the non-negative flag if the original recipe contains. | ||||||||
if (Ext0->hasNonNegFlag()) | ||||||||
IsNonNeg = Ext0->isNonNeg(); | ||||||||
} | ||||||||
|
||||||||
VPMulAccumulateReductionRecipe(VPReductionRecipe *R, VPWidenRecipe *Mul, | ||||||||
Type *ResultTy) | ||||||||
: VPReductionRecipe( | ||||||||
VPDef::VPMulAccumulateReductionSC, R->getRecurrenceKind(), | ||||||||
{R->getChainOp(), Mul->getOperand(0), Mul->getOperand(1)}, | ||||||||
R->getCondOp(), R->isOrdered(), | ||||||||
WrapFlagsTy(Mul->hasNoUnsignedWrap(), Mul->hasNoSignedWrap()), | ||||||||
R->getDebugLoc()), | ||||||||
ExtOp(Instruction::CastOps::CastOpsEnd), ResultTy(ResultTy) { | ||||||||
assert(RecurrenceDescriptor::getOpcode(getRecurrenceKind()) == | ||||||||
Instruction::Add && | ||||||||
"The reduction instruction in MulAccumulateReductionRecipe must be " | ||||||||
"Add"); | ||||||||
setUnderlyingValue(R->getUnderlyingValue()); | ||||||||
} | ||||||||
|
||||||||
~VPMulAccumulateReductionRecipe() override = default; | ||||||||
|
||||||||
VPMulAccumulateReductionRecipe *clone() override { | ||||||||
return new VPMulAccumulateReductionRecipe(this); | ||||||||
} | ||||||||
|
||||||||
VP_CLASSOF_IMPL(VPDef::VPMulAccumulateReductionSC); | ||||||||
|
||||||||
void execute(VPTransformState &State) override { | ||||||||
llvm_unreachable("VPMulAccumulateReductionRecipe should transform to " | ||||||||
"VPWidenCastRecipe + " | ||||||||
"VPWidenRecipe + VPReductionRecipe before execution"); | ||||||||
} | ||||||||
|
||||||||
/// Return the cost of VPMulAccumulateReductionRecipe. | ||||||||
InstructionCost computeCost(ElementCount VF, | ||||||||
VPCostContext &Ctx) const override; | ||||||||
|
||||||||
#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP) | ||||||||
/// Print the recipe. | ||||||||
void print(raw_ostream &O, const Twine &Indent, | ||||||||
VPSlotTracker &SlotTracker) const override; | ||||||||
#endif | ||||||||
|
||||||||
Type *getResultType() const { return ResultTy; } | ||||||||
|
||||||||
/// The first vector value to be extended and reduced. | ||||||||
VPValue *getVecOp0() const { return getOperand(1); } | ||||||||
|
||||||||
/// The second vector value to be extended and reduced. | ||||||||
VPValue *getVecOp1() const { return getOperand(2); } | ||||||||
|
||||||||
/// Return true if this recipe contains extended operands. | ||||||||
bool isExtended() const { return ExtOp != Instruction::CastOps::CastOpsEnd; } | ||||||||
|
||||||||
/// Return the opcode of the extends for the operands. | ||||||||
Instruction::CastOps getExtOpcode() const { return ExtOp; } | ||||||||
|
||||||||
/// Return if the operands are zero-extended. | ||||||||
bool isZExt() const { return ExtOp == Instruction::CastOps::ZExt; } | ||||||||
|
||||||||
/// Return true if the operand extends have the non-negative flag. | ||||||||
bool isNonNeg() const { return IsNonNeg; } | ||||||||
}; | ||||||||
|
||||||||
/// VPReplicateRecipe replicates a given instruction producing multiple scalar | ||||||||
/// copies of the original scalar type, one per lane, instead of producing a | ||||||||
/// single copy of widened type for all lanes. If the instruction is known to be | ||||||||
|
@@ -2922,6 +2711,127 @@ class VPBranchOnMaskRecipe : public VPRecipeBase { | |||||||
} | ||||||||
}; | ||||||||
|
||||||||
/// A recipe to combine multiple recipes into a 'bundle' recipe, which should be | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
Suggested change
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. The recipes aren't bundled until they're in the recipe so I don't think saying "multiple 'bundled' recipes" is correct. The original comment is correct in that the recipes are separate until they're bundled into this class. |
||||||||
/// considered as single entity for cost-modeling and transforms. The recipe | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
Suggested change
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Updated, thanks |
||||||||
/// needs to be 'unbundled', i.e. replaced by its individual recipes before | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
Suggested change
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Updated, thanks |
||||||||
/// execute. | ||||||||
class VPBundleRecipe : public VPSingleDefRecipe { | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. One could bundle recipes that together provide multiple defs, such as interleaved loads. Perhaps more accurately called VPSingleDefBundleRecipe, or There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Updated to |
||||||||
enum class BundleTypes { | ||||||||
ExtendedReduction, | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. So should this be
Suggested change
? |
||||||||
MulAccumulateReduction, | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
Suggested change
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Done thanks |
||||||||
}; | ||||||||
|
||||||||
/// Recipes bundled together in this VPBundleRecipe. | ||||||||
SmallVector<VPSingleDefRecipe *> BundledOps; | ||||||||
|
||||||||
/// Temporary VPValues used for external operands of the bundle, i.e. operands | ||||||||
/// not defined by recipes in the bundle. | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. These are placeholder VPValues defined temporarily by the bundle recipe itself to feed its bundled recipes. Note that the VPBundleRecipe, being a single def VPValue, feeds out-of bundle recipes itself. |
||||||||
SmallVector<VPValue *> TmpValues; | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
Suggested change
? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Updated, thanks |
||||||||
|
||||||||
/// Type of the bundle. | ||||||||
BundleTypes BundleType; | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Better placed next to the enum definition above, documenting each? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Moved the definition down here, thanks |
||||||||
|
||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Worth documenting, especially \p Operands - perhaps better called CloneOperands, perhaps defined to be optional, passed only to save time? Does it really save anything. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Operands is gone now, moved logic from bundle() directly to the constructor, thanks |
||||||||
VPBundleRecipe(BundleTypes BundleType, ArrayRef<VPSingleDefRecipe *> ToBundle) | ||||||||
: VPSingleDefRecipe(VPDef::VPBundleSC, {}, {}), BundledOps(ToBundle), | ||||||||
BundleType(BundleType) { | ||||||||
// Bundle up the operand recipes. | ||||||||
SmallPtrSet<VPUser *, 4> BundledUsers; | ||||||||
for (auto *R : BundledOps) | ||||||||
BundledUsers.insert(R); | ||||||||
|
||||||||
// Recipes in the bundle, except the last one, must only be used inside the | ||||||||
// bundle. If there other external users, clone the recipes for the bundle. | ||||||||
for (const auto &[Idx, R] : enumerate(drop_end(ToBundle))) { | ||||||||
if (all_of(R->users(), [&BundledUsers](VPUser *U) { | ||||||||
return BundledUsers.contains(U); | ||||||||
})) { | ||||||||
if (R->getParent()) | ||||||||
R->removeFromParent(); | ||||||||
continue; | ||||||||
} | ||||||||
// The users external to the bundle. Clone the recipe for use in the | ||||||||
// bundle and update all its in-bundle users. | ||||||||
VPSingleDefRecipe *Copy = R->clone(); | ||||||||
BundledOps[Idx] = Copy; | ||||||||
BundledUsers.insert(Copy); | ||||||||
R->replaceUsesWithIf(Copy, [&BundledUsers](VPUser &U, unsigned) { | ||||||||
return BundledUsers.contains(&U); | ||||||||
}); | ||||||||
} | ||||||||
BundledOps.back()->removeFromParent(); | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. While experimenting with rebasing #136173 on top of this, I've found that the new bundle recipe can't be used when interleaving. This line for example needs to be gated behind EDIT: I've done some more digging and it could actually be an issue specific to partial reductions. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. It looks like we were missing some test coverage for interleaving VPExtendedReductions/VPMulAccumulateReductions. The issue was that we didn't clone the recipes in the bundle when cloning the VPBundleRecipe. Updated and now it should work fine with interleaving (tested in There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Great, thanks for that. |
||||||||
|
||||||||
// Internalize all external operands to the bundled operations. To do so, | ||||||||
// create new temporary VPValues for all operands not defined by recipe in | ||||||||
// the bundle. The original operands are added as operands of the | ||||||||
// VPBundleRecipe. | ||||||||
for (auto *R : BundledOps) { | ||||||||
for (const auto &[Idx, Op] : enumerate(R->operands())) { | ||||||||
auto *Def = Op->getDefiningRecipe(); | ||||||||
if (Def && BundledUsers.contains(Def)) | ||||||||
continue; | ||||||||
addOperand(Op); | ||||||||
TmpValues.push_back(new VPValue()); | ||||||||
R->setOperand(Idx, TmpValues.back()); | ||||||||
} | ||||||||
} | ||||||||
} | ||||||||
|
||||||||
public: | ||||||||
VPBundleRecipe(VPWidenCastRecipe *Ext, VPReductionRecipe *Red) | ||||||||
: VPBundleRecipe(BundleTypes::ExtendedReduction, {Ext, Red}) {} | ||||||||
VPBundleRecipe(VPWidenRecipe *Mul, VPReductionRecipe *Red) | ||||||||
: VPBundleRecipe(BundleTypes::MulAccumulateReduction, {Mul, Red}) {} | ||||||||
VPBundleRecipe(VPWidenCastRecipe *Ext0, VPWidenCastRecipe *Ext1, | ||||||||
VPWidenRecipe *Mul, VPReductionRecipe *Red) | ||||||||
: VPBundleRecipe(BundleTypes::MulAccumulateReduction, | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Can be defined as ExtMulAccumulateReduction? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Updated the type name of the enum value |
||||||||
{Ext0, Ext1, Mul, Red}) {} | ||||||||
VPBundleRecipe(VPWidenCastRecipe *Ext0, VPWidenCastRecipe *Ext1, | ||||||||
VPWidenRecipe *Mul, VPWidenCastRecipe *Ext2, | ||||||||
VPReductionRecipe *Red) | ||||||||
: VPBundleRecipe(BundleTypes::MulAccumulateReduction, | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Can be defined as ExtMulExtAccumulateReduction? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Yep, thanks |
||||||||
{Ext0, Ext1, Mul, Ext2, Red}) {} | ||||||||
|
||||||||
~VPBundleRecipe() override { | ||||||||
SmallPtrSet<VPRecipeBase *, 4> Seen; | ||||||||
for (auto *R : reverse(BundledOps)) | ||||||||
if (Seen.insert(R).second) | ||||||||
delete R; | ||||||||
for (VPValue *T : TmpValues) | ||||||||
delete T; | ||||||||
} | ||||||||
|
||||||||
VP_CLASSOF_IMPL(VPDef::VPBundleSC) | ||||||||
|
||||||||
VPBundleRecipe *clone() override { | ||||||||
assert(!BundledOps.empty() && "empty bundles should be removed"); | ||||||||
return new VPBundleRecipe(BundleType, BundledOps); | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. What happens if we call this after calling There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. This shouldn't happen, I added an assert. |
||||||||
} | ||||||||
|
||||||||
/// Return the VPSingleDefRecipe producing the final result of the bundled | ||||||||
/// recipe. | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Without loss of generality this can be the last bundled recipe. |
||||||||
VPSingleDefRecipe *getResultOp() const { return BundledOps.back(); } | ||||||||
|
||||||||
/// Insert the bundled recipes back into the VPlan, directly before the | ||||||||
/// current recipe. Leaves the bundle recipe empty and the recipe must be | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
Suggested change
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Updated, thanks |
||||||||
/// removed before codegen. | ||||||||
void unbundle(); | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Docs needed. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Added thanks. |
||||||||
|
||||||||
/// Generate the extraction of the appropriate bit from the block mask and the | ||||||||
/// conditional branch. | ||||||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
Suggested change
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Updated, thanks |
||||||||
void execute(VPTransformState &State) override { | ||||||||
llvm_unreachable("recipe must be removed before execute"); | ||||||||
} | ||||||||
|
||||||||
InstructionCost computeCost(ElementCount VF, | ||||||||
VPCostContext &Ctx) const override; | ||||||||
|
||||||||
#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP) | ||||||||
/// Print the recipe. | ||||||||
void print(raw_ostream &O, const Twine &Indent, | ||||||||
VPSlotTracker &SlotTracker) const override; | ||||||||
#endif | ||||||||
}; | ||||||||
|
||||||||
/// VPPredInstPHIRecipe is a recipe for generating the phi nodes needed when | ||||||||
/// control converges back from a Branch-on-Mask. The phi nodes are needed in | ||||||||
/// order to merge values that are set under such a branch and feed their uses. | ||||||||
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
to be consistent, and place below following lex order.
But would
VPExpressionRecipe
be better - conveying the notion that (a) it produces a single value (b) out of multiple simpler components - which are potentially side-effect-free(?) and potentially (sub)expressions themselves(?). I.e., a bundle recipe can potentially be bundled inside another bundle recipe, unbundle() can be recursive. Worth commenting that this may be possible but that currently bundle recipes are restricted to flat/single-level bundling.There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Another option is
VPIdiomRecipe
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Thanks, updated to VPExpressionRecipe, which is also slightly more compact. Tried to update various places refering to bundle as appropriate, just keeping
unbundle
.