Skip to content

Commit c3ec80f

Browse files
committed
[SystemZ] Handle SADDO et.al. and ADD/SUBCARRY
This provides an optimized implementation of SADDO/SSUBO/UADDO/USUBO as well as ADDCARRY/SUBCARRY on top of the new CC implementation. In particular, multi-word arithmetic now uses UADDO/ADDCARRY instead of the old ADDC/ADDE logic, which means we no longer need to use "glue" links for those instructions. This also allows making full use of the memory-based instructions like ALSI, which couldn't be recognized due to limitations in the DAG matcher previously. Also, the llvm.sadd.with.overflow et.al. intrinsincs now expand to directly using the ADD instructions and checking for a CC 3 result. llvm-svn: 331203
1 parent b32f365 commit c3ec80f

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

51 files changed

+11018
-79
lines changed

llvm/lib/Target/SystemZ/SystemZ.h

+16
Original file line numberDiff line numberDiff line change
@@ -47,6 +47,22 @@ const unsigned CCMASK_CMP_O = CCMASK_ANY ^ CCMASK_CMP_UO;
4747
const unsigned CCMASK_ICMP = CCMASK_0 | CCMASK_1 | CCMASK_2;
4848
const unsigned CCMASK_FCMP = CCMASK_0 | CCMASK_1 | CCMASK_2 | CCMASK_3;
4949

50+
// Condition-code mask assignments for arithmetical operations.
51+
const unsigned CCMASK_ARITH_EQ = CCMASK_0;
52+
const unsigned CCMASK_ARITH_LT = CCMASK_1;
53+
const unsigned CCMASK_ARITH_GT = CCMASK_2;
54+
const unsigned CCMASK_ARITH_OVERFLOW = CCMASK_3;
55+
const unsigned CCMASK_ARITH = CCMASK_ANY;
56+
57+
// Condition-code mask assignments for logical operations.
58+
const unsigned CCMASK_LOGICAL_ZERO = CCMASK_0 | CCMASK_2;
59+
const unsigned CCMASK_LOGICAL_NONZERO = CCMASK_1 | CCMASK_2;
60+
const unsigned CCMASK_LOGICAL_CARRY = CCMASK_2 | CCMASK_3;
61+
const unsigned CCMASK_LOGICAL_NOCARRY = CCMASK_0 | CCMASK_1;
62+
const unsigned CCMASK_LOGICAL_BORROW = CCMASK_LOGICAL_NOCARRY;
63+
const unsigned CCMASK_LOGICAL_NOBORROW = CCMASK_LOGICAL_CARRY;
64+
const unsigned CCMASK_LOGICAL = CCMASK_ANY;
65+
5066
// Condition-code mask assignments for CS.
5167
const unsigned CCMASK_CS_EQ = CCMASK_0;
5268
const unsigned CCMASK_CS_NE = CCMASK_1;

llvm/lib/Target/SystemZ/SystemZISelDAGToDAG.cpp

+172
Original file line numberDiff line numberDiff line change
@@ -310,6 +310,11 @@ class SystemZDAGToDAGISel : public SelectionDAGISel {
310310
// Try to use scatter instruction Opcode to implement store Store.
311311
bool tryScatter(StoreSDNode *Store, unsigned Opcode);
312312

313+
// Change a chain of {load; op; store} of the same value into a simple op
314+
// through memory of that value, if the uses of the modified value and its
315+
// address are suitable.
316+
bool tryFoldLoadStoreIntoMemOperand(SDNode *Node);
317+
313318
// Return true if Load and Store are loads and stores of the same size
314319
// and are guaranteed not to overlap. Such operations can be implemented
315320
// using block (SS-format) instructions.
@@ -1196,6 +1201,171 @@ bool SystemZDAGToDAGISel::tryScatter(StoreSDNode *Store, unsigned Opcode) {
11961201
return true;
11971202
}
11981203

1204+
// Check whether or not the chain ending in StoreNode is suitable for doing
1205+
// the {load; op; store} to modify transformation.
1206+
static bool isFusableLoadOpStorePattern(StoreSDNode *StoreNode,
1207+
SDValue StoredVal, SelectionDAG *CurDAG,
1208+
LoadSDNode *&LoadNode,
1209+
SDValue &InputChain) {
1210+
// Is the stored value result 0 of the operation?
1211+
if (StoredVal.getResNo() != 0)
1212+
return false;
1213+
1214+
// Are there other uses of the loaded value than the operation?
1215+
if (!StoredVal.getNode()->hasNUsesOfValue(1, 0))
1216+
return false;
1217+
1218+
// Is the store non-extending and non-indexed?
1219+
if (!ISD::isNormalStore(StoreNode) || StoreNode->isNonTemporal())
1220+
return false;
1221+
1222+
SDValue Load = StoredVal->getOperand(0);
1223+
// Is the stored value a non-extending and non-indexed load?
1224+
if (!ISD::isNormalLoad(Load.getNode()))
1225+
return false;
1226+
1227+
// Return LoadNode by reference.
1228+
LoadNode = cast<LoadSDNode>(Load);
1229+
1230+
// Is store the only read of the loaded value?
1231+
if (!Load.hasOneUse())
1232+
return false;
1233+
1234+
// Is the address of the store the same as the load?
1235+
if (LoadNode->getBasePtr() != StoreNode->getBasePtr() ||
1236+
LoadNode->getOffset() != StoreNode->getOffset())
1237+
return false;
1238+
1239+
// Check if the chain is produced by the load or is a TokenFactor with
1240+
// the load output chain as an operand. Return InputChain by reference.
1241+
SDValue Chain = StoreNode->getChain();
1242+
1243+
bool ChainCheck = false;
1244+
if (Chain == Load.getValue(1)) {
1245+
ChainCheck = true;
1246+
InputChain = LoadNode->getChain();
1247+
} else if (Chain.getOpcode() == ISD::TokenFactor) {
1248+
SmallVector<SDValue, 4> ChainOps;
1249+
for (unsigned i = 0, e = Chain.getNumOperands(); i != e; ++i) {
1250+
SDValue Op = Chain.getOperand(i);
1251+
if (Op == Load.getValue(1)) {
1252+
ChainCheck = true;
1253+
// Drop Load, but keep its chain. No cycle check necessary.
1254+
ChainOps.push_back(Load.getOperand(0));
1255+
continue;
1256+
}
1257+
1258+
// Make sure using Op as part of the chain would not cause a cycle here.
1259+
// In theory, we could check whether the chain node is a predecessor of
1260+
// the load. But that can be very expensive. Instead visit the uses and
1261+
// make sure they all have smaller node id than the load.
1262+
int LoadId = LoadNode->getNodeId();
1263+
for (SDNode::use_iterator UI = Op.getNode()->use_begin(),
1264+
UE = UI->use_end(); UI != UE; ++UI) {
1265+
if (UI.getUse().getResNo() != 0)
1266+
continue;
1267+
if (UI->getNodeId() > LoadId)
1268+
return false;
1269+
}
1270+
1271+
ChainOps.push_back(Op);
1272+
}
1273+
1274+
if (ChainCheck)
1275+
// Make a new TokenFactor with all the other input chains except
1276+
// for the load.
1277+
InputChain = CurDAG->getNode(ISD::TokenFactor, SDLoc(Chain),
1278+
MVT::Other, ChainOps);
1279+
}
1280+
if (!ChainCheck)
1281+
return false;
1282+
1283+
return true;
1284+
}
1285+
1286+
// Change a chain of {load; op; store} of the same value into a simple op
1287+
// through memory of that value, if the uses of the modified value and its
1288+
// address are suitable.
1289+
//
1290+
// The tablegen pattern memory operand pattern is currently not able to match
1291+
// the case where the CC on the original operation are used.
1292+
//
1293+
// See the equivalent routine in X86ISelDAGToDAG for further comments.
1294+
bool SystemZDAGToDAGISel::tryFoldLoadStoreIntoMemOperand(SDNode *Node) {
1295+
StoreSDNode *StoreNode = cast<StoreSDNode>(Node);
1296+
SDValue StoredVal = StoreNode->getOperand(1);
1297+
unsigned Opc = StoredVal->getOpcode();
1298+
SDLoc DL(StoreNode);
1299+
1300+
// Before we try to select anything, make sure this is memory operand size
1301+
// and opcode we can handle. Note that this must match the code below that
1302+
// actually lowers the opcodes.
1303+
EVT MemVT = StoreNode->getMemoryVT();
1304+
unsigned NewOpc = 0;
1305+
bool NegateOperand = false;
1306+
switch (Opc) {
1307+
default:
1308+
return false;
1309+
case SystemZISD::SSUBO:
1310+
NegateOperand = true;
1311+
/* fall through */
1312+
case SystemZISD::SADDO:
1313+
if (MemVT == MVT::i32)
1314+
NewOpc = SystemZ::ASI;
1315+
else if (MemVT == MVT::i64)
1316+
NewOpc = SystemZ::AGSI;
1317+
else
1318+
return false;
1319+
break;
1320+
case SystemZISD::USUBO:
1321+
NegateOperand = true;
1322+
/* fall through */
1323+
case SystemZISD::UADDO:
1324+
if (MemVT == MVT::i32)
1325+
NewOpc = SystemZ::ALSI;
1326+
else if (MemVT == MVT::i64)
1327+
NewOpc = SystemZ::ALGSI;
1328+
else
1329+
return false;
1330+
break;
1331+
}
1332+
1333+
LoadSDNode *LoadNode = nullptr;
1334+
SDValue InputChain;
1335+
if (!isFusableLoadOpStorePattern(StoreNode, StoredVal, CurDAG, LoadNode,
1336+
InputChain))
1337+
return false;
1338+
1339+
SDValue Operand = StoredVal.getOperand(1);
1340+
auto *OperandC = dyn_cast<ConstantSDNode>(Operand);
1341+
if (!OperandC)
1342+
return false;
1343+
auto OperandV = OperandC->getAPIntValue();
1344+
if (NegateOperand)
1345+
OperandV = -OperandV;
1346+
if (OperandV.getMinSignedBits() > 8)
1347+
return false;
1348+
Operand = CurDAG->getTargetConstant(OperandV, DL, MemVT);
1349+
1350+
SDValue Base, Disp;
1351+
if (!selectBDAddr20Only(StoreNode->getBasePtr(), Base, Disp))
1352+
return false;
1353+
1354+
SDValue Ops[] = { Base, Disp, Operand, InputChain };
1355+
MachineSDNode *Result =
1356+
CurDAG->getMachineNode(NewOpc, DL, MVT::i32, MVT::Other, Ops);
1357+
1358+
MachineSDNode::mmo_iterator MemOp = MF->allocateMemRefsArray(2);
1359+
MemOp[0] = StoreNode->getMemOperand();
1360+
MemOp[1] = LoadNode->getMemOperand();
1361+
Result->setMemRefs(MemOp, MemOp + 2);
1362+
1363+
ReplaceUses(SDValue(StoreNode, 0), SDValue(Result, 1));
1364+
ReplaceUses(SDValue(StoredVal.getNode(), 1), SDValue(Result, 0));
1365+
CurDAG->RemoveDeadNode(Node);
1366+
return true;
1367+
}
1368+
11991369
bool SystemZDAGToDAGISel::canUseBlockOperation(StoreSDNode *Store,
12001370
LoadSDNode *Load) const {
12011371
// Check that the two memory operands have the same size.
@@ -1358,6 +1528,8 @@ void SystemZDAGToDAGISel::Select(SDNode *Node) {
13581528
}
13591529

13601530
case ISD::STORE: {
1531+
if (tryFoldLoadStoreIntoMemOperand(Node))
1532+
return;
13611533
auto *Store = cast<StoreSDNode>(Node);
13621534
unsigned ElemBitSize = Store->getValue().getValueSizeInBits();
13631535
if (ElemBitSize == 32) {

0 commit comments

Comments
 (0)