Skip to content

Commit 0b0d112

Browse files
committed
Avoid control flow for copying heap allocations to temporaries
Updates of all the temporaries that contain the address of a candidate object for cold block heapification are currently guarded with ifacmpne instructions. In order to simplify the control flow graph produced for heapification before cold blocks, replace the conditional update of each temporary with an unconditional store using the result of an aternary instruction that either updates the temporary with the heap object address or with the current contents of the temporary unconditionally. This update is inserted into the start of the cold block rather than in a new block preceding the cold block. This is only done if code generation supports ternary opcodes. If ternary opcodes are not supported, ifacmpne checks are still generated instead. The ifacmpne checks can also be forced by setting the environment variable TR_disableTernaryOpForEA. Signed-off-by: Henry Zongaro <zongaro@ca.ibm.com>
1 parent 4e465a0 commit 0b0d112

File tree

2 files changed

+134
-58
lines changed

2 files changed

+134
-58
lines changed

runtime/compiler/optimizer/EscapeAnalysis.cpp

+116-56
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/*******************************************************************************
2-
* Copyright (c) 2000, 2019 IBM Corp. and others
2+
* Copyright (c) 2000, 2020 IBM Corp. and others
33
*
44
* This program and the accompanying materials are made available under
55
* the terms of the Eclipse Public License 2.0 which accompanies this
@@ -1290,7 +1290,7 @@ int32_t TR_EscapeAnalysis::performAnalysisOnce()
12901290

12911291
if (candidate->escapesInColdBlocks())
12921292
{
1293-
heapifyBeforeColdBlocks(candidate);
1293+
heapifyForColdBlocks(candidate);
12941294
if (candidate->_fields)
12951295
{
12961296
int32_t i;
@@ -7053,8 +7053,11 @@ void TR_EscapeAnalysis::makeNonContiguousLocalAllocation(Candidate *candidate)
70537053

70547054

70557055

7056-
void TR_EscapeAnalysis::heapifyBeforeColdBlocks(Candidate *candidate)
7056+
void TR_EscapeAnalysis::heapifyForColdBlocks(Candidate *candidate)
70577057
{
7058+
static char *disableTernaryOpForEA = feGetEnv("TR_disableTernaryOpForEA");
7059+
bool useTernaryOp = !disableTernaryOpForEA && cg()->getSupportsTernary();
7060+
70587061
if (comp()->suppressAllocationInlining())
70597062
return;
70607063

@@ -7406,73 +7409,103 @@ void TR_EscapeAnalysis::heapifyBeforeColdBlocks(Candidate *candidate)
74067409
}
74077410
}
74087411

7412+
TR::TreeTop *insertSymRefStoresAfter = NULL;
7413+
7414+
// If using aternary to perform comparisons, all compares and stores are
7415+
// inserted directly at the start of the cold block
7416+
if (useTernaryOp)
7417+
{
7418+
insertSymRefStoresAfter = coldBlock->getEntry();
7419+
}
7420+
74097421
ListIterator<TR::SymbolReference> symRefsIt(candidate->getSymRefs());
74107422
TR::SymbolReference *symRef;
7423+
bool generatedReusedOperations = false;
7424+
TR::Node *heapTempLoad = NULL;
7425+
TR::Node *candidateStackAddrLoad = NULL;
7426+
74117427
for (symRef = symRefsIt.getFirst(); symRef; symRef = symRefsIt.getNext())
74127428
{
74137429
//
7414-
// Now create the compares (one for each node) and
7415-
// stores if required
7430+
// Now create the compares (one for each node) and stores
74167431
//
7417-
TR::Node *comparisonNode = TR::Node::createif(TR::ifacmpne, TR::Node::createWithSymRef(candidate->_node, TR::aload, 0, symRef), candidate->_node->duplicateTree(), targetBlock->getEntry());
7418-
TR::TreeTop *comparisonTree = TR::TreeTop::create(comp(), comparisonNode, NULL, NULL);
7419-
TR::Block *comparisonBlock = toBlock(cfg->addNode(TR::Block::createEmptyBlock(comparisonNode, comp(), coldBlock->getFrequency())));
7420-
comparisonBlock->inheritBlockInfo(coldBlock, coldBlock->isCold());
7432+
if (useTernaryOp)
7433+
{
7434+
// Reload address of object on heap just once for this block
7435+
if (!heapTempLoad)
7436+
{
7437+
heapTempLoad = TR::Node::createWithSymRef(candidate->_node, TR::aload, 0, heapSymRef);
7438+
candidateStackAddrLoad = candidate->_node->duplicateTree();
7439+
}
74217440

7422-
TR::TreeTop *comparisonEntryTree = comparisonBlock->getEntry();
7423-
TR::TreeTop *comparisonExitTree = comparisonBlock->getExit();
7424-
comparisonEntryTree->join(comparisonTree);
7425-
comparisonTree->join(comparisonExitTree);
7441+
// If variable has address of the stack allocated object, replace
7442+
// with the value of the heap allocated object; otherwise, keep the
7443+
// current value
7444+
//
7445+
// astore <object-temp>
7446+
// aternary
7447+
// acmpeq
7448+
// aload <object-temp>
7449+
// loadaddr <stack-obj>
7450+
// aload <heap-allocated-obj>
7451+
// aload <object-temp>
7452+
//
7453+
TR::Node *symLoad = TR::Node::createWithSymRef(candidate->_node, TR::aload, 0, symRef);
7454+
TR::Node *addrCompareNode = TR::Node::create(candidate->_node, TR::acmpeq, 2, symLoad, candidateStackAddrLoad);
7455+
TR::Node *chooseAddrNode = TR::Node::create(TR::aternary, 3, addrCompareNode, heapTempLoad, symLoad);
7456+
7457+
TR::TreeTop *storeTree = storeHeapifiedToTemp(candidate, chooseAddrNode, symRef);
7458+
7459+
storeTree->join(insertSymRefStoresAfter->getNextTreeTop());
7460+
insertSymRefStoresAfter->join(storeTree);
7461+
}
7462+
else
7463+
{
7464+
TR::Node *comparisonNode = TR::Node::createif(TR::ifacmpne, TR::Node::createWithSymRef(candidate->_node, TR::aload, 0, symRef), candidate->_node->duplicateTree(), targetBlock->getEntry());
7465+
TR::TreeTop *comparisonTree = TR::TreeTop::create(comp(), comparisonNode, NULL, NULL);
7466+
TR::Block *comparisonBlock = toBlock(cfg->addNode(TR::Block::createEmptyBlock(comparisonNode, comp(), coldBlock->getFrequency())));
7467+
comparisonBlock->inheritBlockInfo(coldBlock, coldBlock->isCold());
74267468

7427-
comparisonExitTree->join(insertionPoint);
7469+
TR::TreeTop *comparisonEntryTree = comparisonBlock->getEntry();
7470+
TR::TreeTop *comparisonExitTree = comparisonBlock->getExit();
7471+
comparisonEntryTree->join(comparisonTree);
7472+
comparisonTree->join(comparisonExitTree);
74287473

7429-
if (treeBeforeInsertionPoint)
7430-
treeBeforeInsertionPoint->join(comparisonEntryTree);
7431-
else
7432-
comp()->setStartTree(comparisonEntryTree);
7474+
comparisonExitTree->join(insertionPoint);
74337475

7434-
TR::Node *storeNode = TR::Node::createWithSymRef(TR::astore, 1, 1, TR::Node::createWithSymRef(comparisonNode, TR::aload, 0, heapSymRef), symRef);
7435-
if (symRef->getSymbol()->holdsMonitoredObject())
7436-
storeNode->setLiveMonitorInitStore(true);
7437-
storeNode->setHeapificationStore(true);
7438-
TR::TreeTop *storeTree = TR::TreeTop::create(comp(), storeNode, NULL, NULL);
7476+
if (treeBeforeInsertionPoint)
7477+
treeBeforeInsertionPoint->join(comparisonEntryTree);
7478+
else
7479+
comp()->setStartTree(comparisonEntryTree);
74397480

7481+
TR::Node *heapifiedObjAddrLoad = TR::Node::createWithSymRef(comparisonNode, TR::aload, 0, heapSymRef);
74407482

7441-
if (!symRef->getSymbol()->isParm())
7442-
{
7443-
TR::Node *initStoreNode = TR::Node::createWithSymRef(TR::astore, 1, 1, TR::Node::aconst(comparisonNode, 0), symRef);
7444-
if (symRef->getSymbol()->holdsMonitoredObject())
7445-
initStoreNode->setLiveMonitorInitStore(true);
7446-
TR::TreeTop *initStoreTree = TR::TreeTop::create(comp(), initStoreNode, NULL, NULL);
7447-
TR::TreeTop *startTree = comp()->getStartTree();
7448-
TR::TreeTop *nextToStart = startTree->getNextTreeTop();
7449-
startTree->join(initStoreTree);
7450-
initStoreTree->join(nextToStart);
7451-
}
7483+
TR::TreeTop *storeTree = storeHeapifiedToTemp(candidate, heapifiedObjAddrLoad, symRef);
74527484

7453-
TR::Block *storeBlock = toBlock(cfg->addNode(TR::Block::createEmptyBlock(storeNode, comp(), coldBlock->getFrequency())));
7454-
storeBlock->inheritBlockInfo(coldBlock, coldBlock->isCold());
7485+
TR::Block *storeBlock = toBlock(cfg->addNode(TR::Block::createEmptyBlock(storeTree->getNode(), comp(), coldBlock->getFrequency())));
7486+
storeBlock->inheritBlockInfo(coldBlock, coldBlock->isCold());
74557487

7456-
cfg->addEdge(comparisonBlock, storeBlock);
7457-
cfg->addEdge(comparisonBlock, targetBlock);
7458-
cfg->addEdge(storeBlock, targetBlock);
7459-
if (targetBlock == coldBlock)
7460-
{
7461-
lastComparisonBlock = comparisonBlock;
7462-
lastStoreBlock = storeBlock;
7463-
}
7488+
cfg->addEdge(comparisonBlock, storeBlock);
7489+
cfg->addEdge(comparisonBlock, targetBlock);
7490+
cfg->addEdge(storeBlock, targetBlock);
7491+
if (targetBlock == coldBlock)
7492+
{
7493+
lastComparisonBlock = comparisonBlock;
7494+
lastStoreBlock = storeBlock;
7495+
}
74647496

7465-
TR::TreeTop *storeEntryTree = storeBlock->getEntry();
7466-
TR::TreeTop *storeExitTree = storeBlock->getExit();
7497+
TR::TreeTop *storeEntryTree = storeBlock->getEntry();
7498+
TR::TreeTop *storeExitTree = storeBlock->getExit();
74677499

7468-
comparisonExitTree->join(storeEntryTree);
7469-
storeEntryTree->join(storeTree);
7470-
storeTree->join(storeExitTree);
7471-
storeExitTree->join(insertionPoint);
7500+
comparisonExitTree->join(storeEntryTree);
7501+
storeEntryTree->join(storeTree);
7502+
storeTree->join(storeExitTree);
7503+
storeExitTree->join(insertionPoint);
74727504

7473-
insertionPoint = comparisonEntryTree;
7474-
treeBeforeInsertionPoint = insertionPoint->getPrevTreeTop();
7475-
targetBlock = comparisonBlock;
7505+
insertionPoint = comparisonEntryTree;
7506+
treeBeforeInsertionPoint = insertionPoint->getPrevTreeTop();
7507+
targetBlock = comparisonBlock;
7508+
}
74767509
}
74777510

74787511
cfg->addEdge(heapAllocationBlock, targetBlock);
@@ -7484,9 +7517,11 @@ void TR_EscapeAnalysis::heapifyBeforeColdBlocks(Candidate *candidate)
74847517
TR::CFGNode *predNode = (*pred)->getFrom();
74857518
/* might be removed, keep reference to next object in list */
74867519
pred++;
7487-
if (((predNode != lastComparisonBlock) &&
7488-
(predNode != lastStoreBlock)) ||
7489-
coldBlock->isCatchBlock())
7520+
if ((useTernaryOp && (predNode != heapComparisonBlock)
7521+
&& (predNode != heapAllocationBlock))
7522+
|| (!useTernaryOp && (predNode != lastComparisonBlock)
7523+
&& (predNode != lastStoreBlock))
7524+
|| coldBlock->isCatchBlock())
74907525
{
74917526
TR::Block *predBlock = toBlock(predNode);
74927527
if (!coldBlock->isCatchBlock() &&
@@ -7607,6 +7642,31 @@ void TR_EscapeAnalysis::heapifyBeforeColdBlocks(Candidate *candidate)
76077642
}
76087643

76097644

7645+
TR::TreeTop *TR_EscapeAnalysis::storeHeapifiedToTemp(Candidate *candidate, TR::Node *value, TR::SymbolReference *symRef)
7646+
{
7647+
TR::Node *storeNode = TR::Node::createWithSymRef(TR::astore, 1, 1, value, symRef);
7648+
TR::TreeTop *storeTree = TR::TreeTop::create(comp(), storeNode, NULL, NULL);
7649+
7650+
if (symRef->getSymbol()->holdsMonitoredObject())
7651+
{
7652+
storeNode->setLiveMonitorInitStore(true);
7653+
}
7654+
storeNode->setHeapificationStore(true);
7655+
7656+
if (!symRef->getSymbol()->isParm())
7657+
{
7658+
TR::Node *initStoreNode = TR::Node::createWithSymRef(TR::astore, 1, 1, TR::Node::aconst(candidate->_node, 0), symRef);
7659+
if (symRef->getSymbol()->holdsMonitoredObject())
7660+
initStoreNode->setLiveMonitorInitStore(true);
7661+
TR::TreeTop *initStoreTree = TR::TreeTop::create(comp(), initStoreNode, NULL, NULL);
7662+
TR::TreeTop *startTree = comp()->getStartTree();
7663+
TR::TreeTop *nextToStart = startTree->getNextTreeTop();
7664+
startTree->join(initStoreTree);
7665+
initStoreTree->join(nextToStart);
7666+
}
7667+
7668+
return storeTree;
7669+
}
76107670

76117671

76127672
bool TR_EscapeAnalysis::devirtualizeCallSites()

runtime/compiler/optimizer/EscapeAnalysis.hpp

+18-2
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/*******************************************************************************
2-
* Copyright (c) 2000, 2019 IBM Corp. and others
2+
* Copyright (c) 2000, 2020 IBM Corp. and others
33
*
44
* This program and the accompanying materials are made available under
55
* the terms of the Eclipse Public License 2.0 which accompanies this
@@ -590,7 +590,23 @@ class TR_EscapeAnalysis : public TR::Optimization
590590

591591
void makeContiguousLocalAllocation(Candidate *candidate);
592592
void makeNonContiguousLocalAllocation(Candidate *candidate);
593-
void heapifyBeforeColdBlocks(Candidate *candidate);
593+
void heapifyForColdBlocks(Candidate *candidate);
594+
595+
/**
596+
* \brief Store the supplied address to the specified temporary
597+
*
598+
* \param candidate
599+
* The candidate that is being heapified
600+
*
601+
* \param addr
602+
* The address of the possibly heapified object
603+
*
604+
* \param symRef
605+
* The \ref TR::SymbolReference for the temporay
606+
*
607+
* \return A pointer to the \ref TR::TreeTop containing the store
608+
*/
609+
TR::TreeTop *storeHeapifiedToTemp(Candidate *candidate, TR::Node *addr, TR::SymbolReference *symRef);
594610
bool inlineCallSites();
595611
void scanForExtraCallsToInline();
596612
bool alwaysWorthInlining(TR::Node *callNode);

0 commit comments

Comments
 (0)