Skip to content

Commit 858d1df

Browse files
committed
LiveIntervalAnalysis: Fix missing defs in renameDisconnectedComponents().
Fix renameDisconnectedComponents() creating vreg uses that can be reached from function begin withouthaving a definition (or explicit live-in). Fix this by inserting IMPLICIT_DEF instruction before control-flow joins as necessary. Removes an assert from MachineScheduler because we may now get additional IMPLICIT_DEF when preparing the scheduling policy. This fixes the underlying problem of http://llvm.org/PR27705 llvm-svn: 270259
1 parent 5973bc8 commit 858d1df

File tree

5 files changed

+97
-17
lines changed

5 files changed

+97
-17
lines changed

llvm/include/llvm/CodeGen/LiveInterval.h

+4-2
Original file line numberDiff line numberDiff line change
@@ -896,10 +896,12 @@ namespace llvm {
896896
class ConnectedSubRegClasses {
897897
LiveIntervals &LIS;
898898
MachineRegisterInfo &MRI;
899+
const TargetInstrInfo &TII;
899900

900901
public:
901-
ConnectedSubRegClasses(LiveIntervals &LIS, MachineRegisterInfo &MRI)
902-
: LIS(LIS), MRI(MRI) {}
902+
ConnectedSubRegClasses(LiveIntervals &LIS, MachineRegisterInfo &MRI,
903+
const TargetInstrInfo &TII)
904+
: LIS(LIS), MRI(MRI), TII(TII) {}
903905

904906
/// Split unrelated subregister components and rename them to new vregs.
905907
void renameComponents(LiveInterval &LI) const;

llvm/lib/CodeGen/LiveInterval.cpp

+57-7
Original file line numberDiff line numberDiff line change
@@ -19,13 +19,17 @@
1919
//===----------------------------------------------------------------------===//
2020

2121
#include "llvm/CodeGen/LiveInterval.h"
22+
23+
#include "PHIEliminationUtils.h"
2224
#include "RegisterCoalescer.h"
2325
#include "llvm/ADT/STLExtras.h"
2426
#include "llvm/ADT/SmallSet.h"
2527
#include "llvm/CodeGen/LiveIntervalAnalysis.h"
28+
#include "llvm/CodeGen/MachineInstrBuilder.h"
2629
#include "llvm/CodeGen/MachineRegisterInfo.h"
2730
#include "llvm/Support/Debug.h"
2831
#include "llvm/Support/raw_ostream.h"
32+
#include "llvm/Target/TargetInstrInfo.h"
2933
#include "llvm/Target/TargetRegisterInfo.h"
3034
#include <algorithm>
3135
using namespace llvm;
@@ -1654,19 +1658,65 @@ void ConnectedSubRegClasses::distribute(const IntEqClasses &Classes,
16541658
}
16551659
}
16561660

1661+
static bool subRangeLiveAt(const LiveInterval &LI, SlotIndex Pos) {
1662+
for (const LiveInterval::SubRange &SR : LI.subranges()) {
1663+
if (SR.liveAt(Pos))
1664+
return true;
1665+
}
1666+
return false;
1667+
}
1668+
16571669
void ConnectedSubRegClasses::computeMainRangesFixFlags(
16581670
const IntEqClasses &Classes,
16591671
const SmallVectorImpl<SubRangeInfo> &SubRangeInfos,
16601672
const SmallVectorImpl<LiveInterval*> &Intervals) const {
16611673
BumpPtrAllocator &Allocator = LIS.getVNInfoAllocator();
1674+
const SlotIndexes &Indexes = *LIS.getSlotIndexes();
16621675
for (size_t I = 0, E = Intervals.size(); I < E; ++I) {
1663-
LiveInterval *LI = Intervals[I];
1664-
LI->removeEmptySubRanges();
1676+
LiveInterval &LI = *Intervals[I];
1677+
unsigned Reg = LI.reg;
1678+
1679+
// There must be a def (or live-in) before every use. Splitting vregs may
1680+
// violate this principle as the splitted vreg may not have a definition on
1681+
// every path. Fix this by creating IMPLICIT_DEF instruction as necessary.
1682+
VNInfo::Allocator &VNInfoAllocator = LIS.getVNInfoAllocator();
1683+
for (const LiveInterval::SubRange &SR : LI.subranges()) {
1684+
// Search for "PHI" value numbers in the subranges. We must find a live
1685+
// value in each predecessor block, add an IMPLICIT_DEF where it is
1686+
// missing.
1687+
for (unsigned I = 0; I < SR.valnos.size(); ++I) {
1688+
const VNInfo &VNI = *SR.valnos[I];
1689+
if (VNI.isUnused() || !VNI.isPHIDef())
1690+
continue;
1691+
1692+
SlotIndex Def = VNI.def;
1693+
MachineBasicBlock &MBB = *Indexes.getMBBFromIndex(Def);
1694+
for (MachineBasicBlock *PredMBB : MBB.predecessors()) {
1695+
SlotIndex PredEnd = Indexes.getMBBEndIdx(PredMBB);
1696+
if (subRangeLiveAt(LI, PredEnd.getPrevSlot()))
1697+
continue;
1698+
1699+
MachineBasicBlock::iterator InsertPos =
1700+
llvm::findPHICopyInsertPoint(PredMBB, &MBB, Reg);
1701+
const MCInstrDesc &MCDesc = TII.get(TargetOpcode::IMPLICIT_DEF);
1702+
MachineInstrBuilder ImpDef = BuildMI(*PredMBB, InsertPos,
1703+
DebugLoc(), MCDesc, Reg);
1704+
SlotIndex DefIdx = LIS.InsertMachineInstrInMaps(*ImpDef);
1705+
SlotIndex RegDefIdx = DefIdx.getRegSlot();
1706+
for (LiveInterval::SubRange &SR : LI.subranges()) {
1707+
VNInfo *SRVNI = SR.getNextValue(RegDefIdx, VNInfoAllocator);
1708+
SR.addSegment(LiveRange::Segment(RegDefIdx, PredEnd, SRVNI));
1709+
}
1710+
}
1711+
}
1712+
}
1713+
1714+
LI.removeEmptySubRanges();
16651715
if (I == 0)
1666-
LI->clear();
1667-
LI->constructMainRangeFromSubranges(*LIS.getSlotIndexes(), Allocator);
1716+
LI.clear();
1717+
LI.constructMainRangeFromSubranges(*LIS.getSlotIndexes(), Allocator);
16681718

1669-
for (MachineOperand &MO : MRI.reg_nodbg_operands(LI->reg)) {
1719+
for (MachineOperand &MO : MRI.reg_nodbg_operands(Reg)) {
16701720
if (!MO.isDef())
16711721
continue;
16721722
unsigned SubRegIdx = MO.getSubReg();
@@ -1677,12 +1727,12 @@ void ConnectedSubRegClasses::computeMainRangesFixFlags(
16771727
// flags in these cases.
16781728
if (!MO.isUndef()) {
16791729
SlotIndex Pos = LIS.getInstructionIndex(*MO.getParent());
1680-
if (!LI->liveAt(Pos.getBaseIndex()))
1730+
if (!LI.liveAt(Pos.getBaseIndex()))
16811731
MO.setIsUndef();
16821732
}
16831733
if (!MO.isDead()) {
16841734
SlotIndex Pos = LIS.getInstructionIndex(*MO.getParent());
1685-
if (!LI->liveAt(Pos.getDeadSlot()))
1735+
if (!LI.liveAt(Pos.getDeadSlot()))
16861736
MO.setIsDead();
16871737
}
16881738
}

llvm/lib/CodeGen/LiveIntervalAnalysis.cpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -1571,7 +1571,7 @@ void LiveIntervals::splitSeparateComponents(LiveInterval &LI,
15711571
}
15721572

15731573
void LiveIntervals::renameDisconnectedComponents() {
1574-
ConnectedSubRegClasses SubRegClasses(*this, *MRI);
1574+
ConnectedSubRegClasses SubRegClasses(*this, *MRI, *TII);
15751575

15761576
// Iterate over all vregs. Note that we query getNumVirtRegs() the newly
15771577
// created vregs end up with higher numbers but do not need to be visited as

llvm/lib/CodeGen/MachineScheduler.cpp

+2-7
Original file line numberDiff line numberDiff line change
@@ -444,23 +444,20 @@ void MachineSchedulerBase::scheduleRegions(ScheduleDAGInstrs &Scheduler,
444444
//
445445
// MBB::size() uses instr_iterator to count. Here we need a bundle to count
446446
// as a single instruction.
447-
unsigned RemainingInstrs = std::distance(MBB->begin(), MBB->end());
448447
for(MachineBasicBlock::iterator RegionEnd = MBB->end();
449448
RegionEnd != MBB->begin(); RegionEnd = Scheduler.begin()) {
450449

451450
// Avoid decrementing RegionEnd for blocks with no terminator.
452451
if (RegionEnd != MBB->end() ||
453452
isSchedBoundary(&*std::prev(RegionEnd), &*MBB, MF, TII)) {
454453
--RegionEnd;
455-
// Count the boundary instruction.
456-
--RemainingInstrs;
457454
}
458455

459456
// The next region starts above the previous region. Look backward in the
460457
// instruction stream until we find the nearest boundary.
461458
unsigned NumRegionInstrs = 0;
462459
MachineBasicBlock::iterator I = RegionEnd;
463-
for(;I != MBB->begin(); --I, --RemainingInstrs) {
460+
for (;I != MBB->begin(); --I) {
464461
if (isSchedBoundary(&*std::prev(I), &*MBB, MF, TII))
465462
break;
466463
if (!I->isDebugValue())
@@ -483,8 +480,7 @@ void MachineSchedulerBase::scheduleRegions(ScheduleDAGInstrs &Scheduler,
483480
<< "\n From: " << *I << " To: ";
484481
if (RegionEnd != MBB->end()) dbgs() << *RegionEnd;
485482
else dbgs() << "End";
486-
dbgs() << " RegionInstrs: " << NumRegionInstrs
487-
<< " Remaining: " << RemainingInstrs << "\n");
483+
dbgs() << " RegionInstrs: " << NumRegionInstrs << '\n');
488484
if (DumpCriticalPathLength) {
489485
errs() << MF->getName();
490486
errs() << ":BB# " << MBB->getNumber();
@@ -502,7 +498,6 @@ void MachineSchedulerBase::scheduleRegions(ScheduleDAGInstrs &Scheduler,
502498
// scheduler for the top of it's scheduled region.
503499
RegionEnd = Scheduler.begin();
504500
}
505-
assert(RemainingInstrs == 0 && "Instruction count mismatch!");
506501
Scheduler.finishBlock();
507502
// FIXME: Ideally, no further passes should rely on kill flags. However,
508503
// thumb2 size reduction is currently an exception, so the PostMIScheduler
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,33 @@
1+
; RUN: llc -verify-machineinstrs -o /dev/null %s
2+
; Check that renameDisconnectedComponents() does not create vregs without a
3+
; definition on every path (there should at least be IMPLICIT_DEF instructions).
4+
target triple = "amdgcn--"
5+
6+
define void @func() {
7+
B0:
8+
br i1 undef, label %B1, label %B2
9+
10+
B1:
11+
br label %B2
12+
13+
B2:
14+
%v0 = phi <4 x float> [ zeroinitializer, %B1 ], [ <float 0.0, float 0.0, float 0.0, float undef>, %B0 ]
15+
br i1 undef, label %B20.1, label %B20.2
16+
17+
B20.1:
18+
br label %B20.2
19+
20+
B20.2:
21+
%v2 = phi <4 x float> [ zeroinitializer, %B20.1 ], [ %v0, %B2 ]
22+
br i1 undef, label %B30.1, label %B30.2
23+
24+
B30.1:
25+
%sub = fsub <4 x float> %v2, undef
26+
br label %B30.2
27+
28+
B30.2:
29+
%v3 = phi <4 x float> [ %sub, %B30.1 ], [ %v2, %B20.2 ]
30+
%ve0 = extractelement <4 x float> %v3, i32 0
31+
store float %ve0, float addrspace(3)* undef, align 4
32+
ret void
33+
}

0 commit comments

Comments
 (0)