Skip to content

Commit c0f3dfb

Browse files
committed
[DebugInfo] Use variadic debug values to salvage BinOps and GEP instrs with non-const operands
This patch improves salvageDebugInfoImpl by allowing it to salvage arithmetic operations with two or more non-const operands; this includes the GetElementPtr instruction, and most Binary Operator instructions. These salvages produce DIArgList locations and are only valid for dbg.values, as currently variadic DIExpressions must use DW_OP_stack_value. This functionality is also only added for salvageDebugInfoForDbgValues; other functions that directly call salvageDebugInfoImpl (such as in ISel or Coroutine frame building) can be updated in a later patch. Differential Revision: https://reviews.llvm.org/D91722
1 parent ea834c8 commit c0f3dfb

17 files changed

+399
-132
lines changed

llvm/include/llvm/IR/DebugInfoMetadata.h

+14
Original file line numberDiff line numberDiff line change
@@ -2583,6 +2583,16 @@ class DIExpression : public MDNode {
25832583
return Elements[I];
25842584
}
25852585

2586+
/// Return the number of unique location operands referred to (via
2587+
/// DW_OP_LLVM_arg) in this expression; this is not necessarily the number of
2588+
/// instances of DW_OP_LLVM_arg within the expression.
2589+
/// For example, for the expression:
2590+
/// (DW_OP_LLVM_arg 0, DW_OP_LLVM_arg 1, DW_OP_plus,
2591+
/// DW_OP_LLVM_arg 0, DW_OP_mul)
2592+
/// This function would return 2, as there are two unique location operands
2593+
/// (0 and 1).
2594+
uint64_t getNumLocationOperands() const;
2595+
25862596
/// Determine whether this represents a standalone constant value.
25872597
bool isConstant() const;
25882598

@@ -2731,6 +2741,10 @@ class DIExpression : public MDNode {
27312741
/// return true with an offset of zero.
27322742
bool extractIfOffset(int64_t &Offset) const;
27332743

2744+
/// Returns true iff this DIExpression contains at least one instance of
2745+
/// `DW_OP_LLVM_arg, n` for all n in [0, N).
2746+
bool hasAllLocationOps(unsigned N) const;
2747+
27342748
/// Checks if the last 4 elements of the expression are DW_OP_constu <DWARF
27352749
/// Address Space> DW_OP_swap DW_OP_xderef and extracts the <DWARF Address
27362750
/// Space>.

llvm/include/llvm/IR/Instructions.h

+3-1
Original file line numberDiff line numberDiff line change
@@ -1122,7 +1122,9 @@ class GetElementPtrInst : public Instruction {
11221122
/// must be at least as wide as the IntPtr type for the address space of
11231123
/// the base GEP pointer.
11241124
bool accumulateConstantOffset(const DataLayout &DL, APInt &Offset) const;
1125-
1125+
bool collectOffset(const DataLayout &DL, unsigned BitWidth,
1126+
SmallDenseMap<Value *, APInt, 8> &VariableOffsets,
1127+
APInt &ConstantOffset) const;
11261128
// Methods for support type inquiry through isa, cast, and dyn_cast:
11271129
static bool classof(const Instruction *I) {
11281130
return (I->getOpcode() == Instruction::GetElementPtr);

llvm/include/llvm/IR/IntrinsicInst.h

+5
Original file line numberDiff line numberDiff line change
@@ -204,6 +204,11 @@ class DbgVariableIntrinsic : public DbgInfoIntrinsic {
204204

205205
void replaceVariableLocationOp(Value *OldValue, Value *NewValue);
206206
void replaceVariableLocationOp(unsigned OpIdx, Value *NewValue);
207+
/// Adding a new location operand will always result in this intrinsic using
208+
/// an ArgList, and must always be accompanied by a new expression that uses
209+
/// the new operand.
210+
void addVariableLocationOps(ArrayRef<Value *> NewValues,
211+
DIExpression *NewExpr);
207212

208213
void setVariable(DILocalVariable *NewVar) {
209214
setArgOperand(1, MetadataAsValue::get(NewVar->getContext(), NewVar));

llvm/include/llvm/IR/Operator.h

+6
Original file line numberDiff line numberDiff line change
@@ -576,6 +576,12 @@ class GEPOperator
576576
Type *SourceType, ArrayRef<const Value *> Index, const DataLayout &DL,
577577
APInt &Offset,
578578
function_ref<bool(Value &, APInt &)> ExternalAnalysis = nullptr);
579+
580+
/// Collect the offset of this GEP as a map of Values to their associated
581+
/// APInt multipliers, as well as a total Constant Offset.
582+
bool collectOffset(const DataLayout &DL, unsigned BitWidth,
583+
SmallDenseMap<Value *, APInt, 8> &VariableOffsets,
584+
APInt &ConstantOffset) const;
579585
};
580586

581587
class PtrToIntOperator

llvm/include/llvm/Transforms/Utils/Local.h

+2-1
Original file line numberDiff line numberDiff line change
@@ -314,7 +314,8 @@ void salvageDebugInfoForDbgValues(Instruction &I,
314314
/// appended to the expression. \p LocNo: the index of the location operand to
315315
/// which \p I applies, should be 0 for debug info without a DIArgList.
316316
DIExpression *salvageDebugInfoImpl(Instruction &I, DIExpression *DIExpr,
317-
bool StackVal, unsigned LocNo);
317+
bool StackVal, unsigned LocNo,
318+
SmallVectorImpl<Value *> &AdditionalValues);
318319

319320
/// Point debug users of \p From to \p To or salvage them. Use this function
320321
/// only when replacing all uses of \p From with \p To, with a guarantee that

llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

+12-3
Original file line numberDiff line numberDiff line change
@@ -1229,6 +1229,10 @@ void SelectionDAGBuilder::resolveDanglingDebugInfo(const Value *V,
12291229
}
12301230

12311231
void SelectionDAGBuilder::salvageUnresolvedDbgValue(DanglingDebugInfo &DDI) {
1232+
// TODO: For the variadic implementation, instead of only checking the fail
1233+
// state of `handleDebugValue`, we need know specifically which values were
1234+
// invalid, so that we attempt to salvage only those values when processing
1235+
// a DIArgList.
12321236
assert(!DDI.getDI()->hasArgList() &&
12331237
"Not implemented for variadic dbg_values");
12341238
Value *V = DDI.getDI()->getValue(0);
@@ -1252,16 +1256,21 @@ void SelectionDAGBuilder::salvageUnresolvedDbgValue(DanglingDebugInfo &DDI) {
12521256
while (isa<Instruction>(V)) {
12531257
Instruction &VAsInst = *cast<Instruction>(V);
12541258
// Temporary "0", awaiting real implementation.
1255-
DIExpression *NewExpr = salvageDebugInfoImpl(VAsInst, Expr, StackValue, 0);
1259+
SmallVector<Value *, 4> AdditionalValues;
1260+
DIExpression *SalvagedExpr =
1261+
salvageDebugInfoImpl(VAsInst, Expr, StackValue, 0, AdditionalValues);
12561262

12571263
// If we cannot salvage any further, and haven't yet found a suitable debug
12581264
// expression, bail out.
1259-
if (!NewExpr)
1265+
// TODO: If AdditionalValues isn't empty, then the salvage can only be
1266+
// represented with a DBG_VALUE_LIST, so we give up. When we have support
1267+
// here for variadic dbg_values, remove that condition.
1268+
if (!SalvagedExpr || !AdditionalValues.empty())
12601269
break;
12611270

12621271
// New value and expr now represent this debuginfo.
12631272
V = VAsInst.getOperand(0);
1264-
Expr = NewExpr;
1273+
Expr = SalvagedExpr;
12651274

12661275
// Some kind of simplification occurred: check whether the operand of the
12671276
// salvaged debug expression can be encoded in this DAG.

llvm/lib/IR/DebugInfoMetadata.cpp

+21
Original file line numberDiff line numberDiff line change
@@ -1236,6 +1236,17 @@ bool DIExpression::extractIfOffset(int64_t &Offset) const {
12361236
return false;
12371237
}
12381238

1239+
bool DIExpression::hasAllLocationOps(unsigned N) const {
1240+
SmallDenseSet<uint64_t, 4> SeenOps;
1241+
for (auto ExprOp : expr_ops())
1242+
if (ExprOp.getOp() == dwarf::DW_OP_LLVM_arg)
1243+
SeenOps.insert(ExprOp.getArg(0));
1244+
for (uint64_t Idx = 0; Idx < N; ++Idx)
1245+
if (!is_contained(SeenOps, Idx))
1246+
return false;
1247+
return true;
1248+
}
1249+
12391250
const DIExpression *DIExpression::extractAddressClass(const DIExpression *Expr,
12401251
unsigned &AddrClass) {
12411252
// FIXME: This seems fragile. Nothing that verifies that these elements
@@ -1450,6 +1461,16 @@ Optional<DIExpression *> DIExpression::createFragmentExpression(
14501461
return DIExpression::get(Expr->getContext(), Ops);
14511462
}
14521463

1464+
uint64_t DIExpression::getNumLocationOperands() const {
1465+
uint64_t Result = 0;
1466+
for (auto ExprOp : expr_ops())
1467+
if (ExprOp.getOp() == dwarf::DW_OP_LLVM_arg)
1468+
Result = std::max(Result, ExprOp.getArg(0) + 1);
1469+
assert(hasAllLocationOps(Result) &&
1470+
"Expression is missing one or more location operands.");
1471+
return Result;
1472+
}
1473+
14531474
bool DIExpression::isConstant() const {
14541475
// Recognize DW_OP_constu C DW_OP_stack_value (DW_OP_LLVM_fragment Len Ofs)?.
14551476
if (getNumElements() != 3 && getNumElements() != 6)

llvm/lib/IR/Instructions.cpp

+9
Original file line numberDiff line numberDiff line change
@@ -1793,6 +1793,15 @@ bool GetElementPtrInst::accumulateConstantOffset(const DataLayout &DL,
17931793
return cast<GEPOperator>(this)->accumulateConstantOffset(DL, Offset);
17941794
}
17951795

1796+
bool GetElementPtrInst::collectOffset(
1797+
const DataLayout &DL, unsigned BitWidth,
1798+
SmallDenseMap<Value *, APInt, 8> &VariableOffsets,
1799+
APInt &ConstantOffset) const {
1800+
// Delegate to the generic GEPOperator implementation.
1801+
return cast<GEPOperator>(this)->collectOffset(DL, BitWidth, VariableOffsets,
1802+
ConstantOffset);
1803+
}
1804+
17961805
//===----------------------------------------------------------------------===//
17971806
// ExtractElementInst Implementation
17981807
//===----------------------------------------------------------------------===//

llvm/lib/IR/IntrinsicInst.cpp

+17
Original file line numberDiff line numberDiff line change
@@ -117,6 +117,23 @@ void DbgVariableIntrinsic::replaceVariableLocationOp(unsigned OpIdx,
117117
0, MetadataAsValue::get(getContext(), DIArgList::get(getContext(), MDs)));
118118
}
119119

120+
void DbgVariableIntrinsic::addVariableLocationOps(ArrayRef<Value *> NewValues,
121+
DIExpression *NewExpr) {
122+
assert(NewExpr->hasAllLocationOps(getNumVariableLocationOps() +
123+
NewValues.size()) &&
124+
"NewExpr for debug variable intrinsic does not reference every "
125+
"location operand.");
126+
assert(!is_contained(NewValues, nullptr) && "New values must be non-null");
127+
setArgOperand(2, MetadataAsValue::get(getContext(), NewExpr));
128+
SmallVector<ValueAsMetadata *, 4> MDs;
129+
for (auto *VMD : location_ops())
130+
MDs.push_back(getAsMetadata(VMD));
131+
for (auto *VMD : NewValues)
132+
MDs.push_back(getAsMetadata(VMD));
133+
setArgOperand(
134+
0, MetadataAsValue::get(getContext(), DIArgList::get(getContext(), MDs)));
135+
}
136+
120137
Optional<uint64_t> DbgVariableIntrinsic::getFragmentSizeInBits() const {
121138
if (auto Fragment = getExpression()->getFragmentInfo())
122139
return Fragment->SizeInBits;

llvm/lib/IR/Operator.cpp

+57
Original file line numberDiff line numberDiff line change
@@ -142,4 +142,61 @@ bool GEPOperator::accumulateConstantOffset(
142142
}
143143
return true;
144144
}
145+
146+
bool GEPOperator::collectOffset(
147+
const DataLayout &DL, unsigned BitWidth,
148+
SmallDenseMap<Value *, APInt, 8> &VariableOffsets,
149+
APInt &ConstantOffset) const {
150+
assert(BitWidth == DL.getIndexSizeInBits(getPointerAddressSpace()) &&
151+
"The offset bit width does not match DL specification.");
152+
153+
auto CollectConstantOffset = [&](APInt Index, uint64_t Size) {
154+
Index = Index.sextOrTrunc(BitWidth);
155+
APInt IndexedSize = APInt(BitWidth, Size);
156+
ConstantOffset += Index * IndexedSize;
157+
};
158+
159+
for (gep_type_iterator GTI = gep_type_begin(this), GTE = gep_type_end(this);
160+
GTI != GTE; ++GTI) {
161+
// Scalable vectors are multiplied by a runtime constant.
162+
bool ScalableType = isa<ScalableVectorType>(GTI.getIndexedType());
163+
164+
Value *V = GTI.getOperand();
165+
StructType *STy = GTI.getStructTypeOrNull();
166+
// Handle ConstantInt if possible.
167+
if (auto ConstOffset = dyn_cast<ConstantInt>(V)) {
168+
if (ConstOffset->isZero())
169+
continue;
170+
// If the type is scalable and the constant is not zero (vscale * n * 0 =
171+
// 0) bailout.
172+
// TODO: If the runtime value is accessible at any point before DWARF
173+
// emission, then we could potentially keep a forward reference to it
174+
// in the debug value to be filled in later.
175+
if (ScalableType)
176+
return false;
177+
// Handle a struct index, which adds its field offset to the pointer.
178+
if (STy) {
179+
unsigned ElementIdx = ConstOffset->getZExtValue();
180+
const StructLayout *SL = DL.getStructLayout(STy);
181+
// Element offset is in bytes.
182+
CollectConstantOffset(APInt(BitWidth, SL->getElementOffset(ElementIdx)),
183+
1);
184+
continue;
185+
}
186+
CollectConstantOffset(ConstOffset->getValue(),
187+
DL.getTypeAllocSize(GTI.getIndexedType()));
188+
continue;
189+
}
190+
191+
if (STy || ScalableType)
192+
return false;
193+
// Insert an initial offset of 0 for V iff none exists already, then
194+
// increment the offset by IndexedSize.
195+
VariableOffsets.try_emplace(V, BitWidth, 0);
196+
APInt IndexedSize =
197+
APInt(BitWidth, DL.getTypeAllocSize(GTI.getIndexedType()));
198+
VariableOffsets[V] += IndexedSize;
199+
}
200+
return true;
201+
}
145202
} // namespace llvm

llvm/lib/Transforms/Coroutines/CoroFrame.cpp

+9-4
Original file line numberDiff line numberDiff line change
@@ -2172,10 +2172,15 @@ void coro::salvageDebugInfo(
21722172
} else if (auto *StInst = dyn_cast<StoreInst>(Storage)) {
21732173
Storage = StInst->getOperand(0);
21742174
} else if (auto *GEPInst = dyn_cast<GetElementPtrInst>(Storage)) {
2175-
Expr = llvm::salvageDebugInfoImpl(*GEPInst, Expr,
2176-
/*WithStackValue=*/false, 0);
2177-
if (!Expr)
2178-
return;
2175+
SmallVector<Value *> AdditionalValues;
2176+
DIExpression *SalvagedExpr = llvm::salvageDebugInfoImpl(
2177+
*GEPInst, Expr,
2178+
/*WithStackValue=*/false, 0, AdditionalValues);
2179+
// Debug declares cannot currently handle additional location
2180+
// operands.
2181+
if (!SalvagedExpr || !AdditionalValues.empty())
2182+
break;
2183+
Expr = SalvagedExpr;
21792184
Storage = GEPInst->getOperand(0);
21802185
} else if (auto *BCInst = dyn_cast<llvm::BitCastInst>(Storage))
21812186
Storage = BCInst->getOperand(0);

0 commit comments

Comments
 (0)