@@ -310,6 +310,11 @@ class SystemZDAGToDAGISel : public SelectionDAGISel {
310
310
// Try to use scatter instruction Opcode to implement store Store.
311
311
bool tryScatter (StoreSDNode *Store, unsigned Opcode);
312
312
313
+ // Change a chain of {load; op; store} of the same value into a simple op
314
+ // through memory of that value, if the uses of the modified value and its
315
+ // address are suitable.
316
+ bool tryFoldLoadStoreIntoMemOperand (SDNode *Node);
317
+
313
318
// Return true if Load and Store are loads and stores of the same size
314
319
// and are guaranteed not to overlap. Such operations can be implemented
315
320
// using block (SS-format) instructions.
@@ -1196,6 +1201,171 @@ bool SystemZDAGToDAGISel::tryScatter(StoreSDNode *Store, unsigned Opcode) {
1196
1201
return true ;
1197
1202
}
1198
1203
1204
+ // Check whether or not the chain ending in StoreNode is suitable for doing
1205
+ // the {load; op; store} to modify transformation.
1206
+ static bool isFusableLoadOpStorePattern (StoreSDNode *StoreNode,
1207
+ SDValue StoredVal, SelectionDAG *CurDAG,
1208
+ LoadSDNode *&LoadNode,
1209
+ SDValue &InputChain) {
1210
+ // Is the stored value result 0 of the operation?
1211
+ if (StoredVal.getResNo () != 0 )
1212
+ return false ;
1213
+
1214
+ // Are there other uses of the loaded value than the operation?
1215
+ if (!StoredVal.getNode ()->hasNUsesOfValue (1 , 0 ))
1216
+ return false ;
1217
+
1218
+ // Is the store non-extending and non-indexed?
1219
+ if (!ISD::isNormalStore (StoreNode) || StoreNode->isNonTemporal ())
1220
+ return false ;
1221
+
1222
+ SDValue Load = StoredVal->getOperand (0 );
1223
+ // Is the stored value a non-extending and non-indexed load?
1224
+ if (!ISD::isNormalLoad (Load.getNode ()))
1225
+ return false ;
1226
+
1227
+ // Return LoadNode by reference.
1228
+ LoadNode = cast<LoadSDNode>(Load);
1229
+
1230
+ // Is store the only read of the loaded value?
1231
+ if (!Load.hasOneUse ())
1232
+ return false ;
1233
+
1234
+ // Is the address of the store the same as the load?
1235
+ if (LoadNode->getBasePtr () != StoreNode->getBasePtr () ||
1236
+ LoadNode->getOffset () != StoreNode->getOffset ())
1237
+ return false ;
1238
+
1239
+ // Check if the chain is produced by the load or is a TokenFactor with
1240
+ // the load output chain as an operand. Return InputChain by reference.
1241
+ SDValue Chain = StoreNode->getChain ();
1242
+
1243
+ bool ChainCheck = false ;
1244
+ if (Chain == Load.getValue (1 )) {
1245
+ ChainCheck = true ;
1246
+ InputChain = LoadNode->getChain ();
1247
+ } else if (Chain.getOpcode () == ISD::TokenFactor) {
1248
+ SmallVector<SDValue, 4 > ChainOps;
1249
+ for (unsigned i = 0 , e = Chain.getNumOperands (); i != e; ++i) {
1250
+ SDValue Op = Chain.getOperand (i);
1251
+ if (Op == Load.getValue (1 )) {
1252
+ ChainCheck = true ;
1253
+ // Drop Load, but keep its chain. No cycle check necessary.
1254
+ ChainOps.push_back (Load.getOperand (0 ));
1255
+ continue ;
1256
+ }
1257
+
1258
+ // Make sure using Op as part of the chain would not cause a cycle here.
1259
+ // In theory, we could check whether the chain node is a predecessor of
1260
+ // the load. But that can be very expensive. Instead visit the uses and
1261
+ // make sure they all have smaller node id than the load.
1262
+ int LoadId = LoadNode->getNodeId ();
1263
+ for (SDNode::use_iterator UI = Op.getNode ()->use_begin (),
1264
+ UE = UI->use_end (); UI != UE; ++UI) {
1265
+ if (UI.getUse ().getResNo () != 0 )
1266
+ continue ;
1267
+ if (UI->getNodeId () > LoadId)
1268
+ return false ;
1269
+ }
1270
+
1271
+ ChainOps.push_back (Op);
1272
+ }
1273
+
1274
+ if (ChainCheck)
1275
+ // Make a new TokenFactor with all the other input chains except
1276
+ // for the load.
1277
+ InputChain = CurDAG->getNode (ISD::TokenFactor, SDLoc (Chain),
1278
+ MVT::Other, ChainOps);
1279
+ }
1280
+ if (!ChainCheck)
1281
+ return false ;
1282
+
1283
+ return true ;
1284
+ }
1285
+
1286
+ // Change a chain of {load; op; store} of the same value into a simple op
1287
+ // through memory of that value, if the uses of the modified value and its
1288
+ // address are suitable.
1289
+ //
1290
+ // The tablegen pattern memory operand pattern is currently not able to match
1291
+ // the case where the CC on the original operation are used.
1292
+ //
1293
+ // See the equivalent routine in X86ISelDAGToDAG for further comments.
1294
+ bool SystemZDAGToDAGISel::tryFoldLoadStoreIntoMemOperand (SDNode *Node) {
1295
+ StoreSDNode *StoreNode = cast<StoreSDNode>(Node);
1296
+ SDValue StoredVal = StoreNode->getOperand (1 );
1297
+ unsigned Opc = StoredVal->getOpcode ();
1298
+ SDLoc DL (StoreNode);
1299
+
1300
+ // Before we try to select anything, make sure this is memory operand size
1301
+ // and opcode we can handle. Note that this must match the code below that
1302
+ // actually lowers the opcodes.
1303
+ EVT MemVT = StoreNode->getMemoryVT ();
1304
+ unsigned NewOpc = 0 ;
1305
+ bool NegateOperand = false ;
1306
+ switch (Opc) {
1307
+ default :
1308
+ return false ;
1309
+ case SystemZISD::SSUBO:
1310
+ NegateOperand = true ;
1311
+ /* fall through */
1312
+ case SystemZISD::SADDO:
1313
+ if (MemVT == MVT::i32)
1314
+ NewOpc = SystemZ::ASI;
1315
+ else if (MemVT == MVT::i64)
1316
+ NewOpc = SystemZ::AGSI;
1317
+ else
1318
+ return false ;
1319
+ break ;
1320
+ case SystemZISD::USUBO:
1321
+ NegateOperand = true ;
1322
+ /* fall through */
1323
+ case SystemZISD::UADDO:
1324
+ if (MemVT == MVT::i32)
1325
+ NewOpc = SystemZ::ALSI;
1326
+ else if (MemVT == MVT::i64)
1327
+ NewOpc = SystemZ::ALGSI;
1328
+ else
1329
+ return false ;
1330
+ break ;
1331
+ }
1332
+
1333
+ LoadSDNode *LoadNode = nullptr ;
1334
+ SDValue InputChain;
1335
+ if (!isFusableLoadOpStorePattern (StoreNode, StoredVal, CurDAG, LoadNode,
1336
+ InputChain))
1337
+ return false ;
1338
+
1339
+ SDValue Operand = StoredVal.getOperand (1 );
1340
+ auto *OperandC = dyn_cast<ConstantSDNode>(Operand);
1341
+ if (!OperandC)
1342
+ return false ;
1343
+ auto OperandV = OperandC->getAPIntValue ();
1344
+ if (NegateOperand)
1345
+ OperandV = -OperandV;
1346
+ if (OperandV.getMinSignedBits () > 8 )
1347
+ return false ;
1348
+ Operand = CurDAG->getTargetConstant (OperandV, DL, MemVT);
1349
+
1350
+ SDValue Base, Disp;
1351
+ if (!selectBDAddr20Only (StoreNode->getBasePtr (), Base, Disp))
1352
+ return false ;
1353
+
1354
+ SDValue Ops[] = { Base, Disp, Operand, InputChain };
1355
+ MachineSDNode *Result =
1356
+ CurDAG->getMachineNode (NewOpc, DL, MVT::i32, MVT::Other, Ops);
1357
+
1358
+ MachineSDNode::mmo_iterator MemOp = MF->allocateMemRefsArray (2 );
1359
+ MemOp[0 ] = StoreNode->getMemOperand ();
1360
+ MemOp[1 ] = LoadNode->getMemOperand ();
1361
+ Result->setMemRefs (MemOp, MemOp + 2 );
1362
+
1363
+ ReplaceUses (SDValue (StoreNode, 0 ), SDValue (Result, 1 ));
1364
+ ReplaceUses (SDValue (StoredVal.getNode (), 1 ), SDValue (Result, 0 ));
1365
+ CurDAG->RemoveDeadNode (Node);
1366
+ return true ;
1367
+ }
1368
+
1199
1369
bool SystemZDAGToDAGISel::canUseBlockOperation (StoreSDNode *Store,
1200
1370
LoadSDNode *Load) const {
1201
1371
// Check that the two memory operands have the same size.
@@ -1358,6 +1528,8 @@ void SystemZDAGToDAGISel::Select(SDNode *Node) {
1358
1528
}
1359
1529
1360
1530
case ISD::STORE: {
1531
+ if (tryFoldLoadStoreIntoMemOperand (Node))
1532
+ return ;
1361
1533
auto *Store = cast<StoreSDNode>(Node);
1362
1534
unsigned ElemBitSize = Store->getValue ().getValueSizeInBits ();
1363
1535
if (ElemBitSize == 32 ) {
0 commit comments