Skip to content

Commit c75e454

Browse files
committed
[RISCV] Transform unaligned RVV vector loads/stores to aligned ones
This patch adds support for loading and storing unaligned vectors via an equivalently-sized i8 vector type, which has support in the RVV specification for byte-aligned access. This offers a more optimal path for handling of unaligned fixed-length vector accesses, which are currently scalarized. It also prevents crashing when `LegalizeDAG` sees an unaligned scalable-vector load/store operation. Future work could be to investigate loading/storing via the largest vector element type for the given alignment, in case that would be more optimal on hardware. For instance, a 4-byte-aligned nxv2i64 vector load could loaded as nxv4i32 instead of as nxv16i8. Reviewed By: craig.topper Differential Revision: https://reviews.llvm.org/D104032
1 parent c58cf69 commit c75e454

File tree

4 files changed

+295
-289
lines changed

4 files changed

+295
-289
lines changed

llvm/lib/Target/RISCV/RISCVISelLowering.cpp

+84-13
Original file line numberDiff line numberDiff line change
@@ -523,6 +523,9 @@ RISCVTargetLowering::RISCVTargetLowering(const TargetMachine &TM,
523523
for (unsigned VPOpc : IntegerVPOps)
524524
setOperationAction(VPOpc, VT, Custom);
525525

526+
setOperationAction(ISD::LOAD, VT, Custom);
527+
setOperationAction(ISD::STORE, VT, Custom);
528+
526529
setOperationAction(ISD::MLOAD, VT, Custom);
527530
setOperationAction(ISD::MSTORE, VT, Custom);
528531
setOperationAction(ISD::MGATHER, VT, Custom);
@@ -584,6 +587,9 @@ RISCVTargetLowering::RISCVTargetLowering(const TargetMachine &TM,
584587
setOperationAction(ISD::VECREDUCE_FMAX, VT, Custom);
585588
setOperationAction(ISD::FCOPYSIGN, VT, Legal);
586589

590+
setOperationAction(ISD::LOAD, VT, Custom);
591+
setOperationAction(ISD::STORE, VT, Custom);
592+
587593
setOperationAction(ISD::MLOAD, VT, Custom);
588594
setOperationAction(ISD::MSTORE, VT, Custom);
589595
setOperationAction(ISD::MGATHER, VT, Custom);
@@ -1891,6 +1897,66 @@ static SDValue getRVVFPExtendOrRound(SDValue Op, MVT VT, MVT ContainerVT,
18911897
return DAG.getNode(RVVOpc, DL, ContainerVT, Op, Mask, VL);
18921898
}
18931899

1900+
// While RVV has alignment restrictions, we should always be able to load as a
1901+
// legal equivalently-sized byte-typed vector instead. This method is
1902+
// responsible for re-expressing a ISD::LOAD via a correctly-aligned type. If
1903+
// the load is already correctly-aligned, it returns SDValue().
1904+
SDValue RISCVTargetLowering::expandUnalignedRVVLoad(SDValue Op,
1905+
SelectionDAG &DAG) const {
1906+
auto *Load = cast<LoadSDNode>(Op);
1907+
assert(Load && Load->getMemoryVT().isVector() && "Expected vector load");
1908+
1909+
if (allowsMemoryAccessForAlignment(*DAG.getContext(), DAG.getDataLayout(),
1910+
Load->getMemoryVT(),
1911+
*Load->getMemOperand()))
1912+
return SDValue();
1913+
1914+
SDLoc DL(Op);
1915+
MVT VT = Op.getSimpleValueType();
1916+
unsigned EltSizeBits = VT.getScalarSizeInBits();
1917+
assert((EltSizeBits == 16 || EltSizeBits == 32 || EltSizeBits == 64) &&
1918+
"Unexpected unaligned RVV load type");
1919+
MVT NewVT =
1920+
MVT::getVectorVT(MVT::i8, VT.getVectorElementCount() * (EltSizeBits / 8));
1921+
assert(NewVT.isValid() &&
1922+
"Expecting equally-sized RVV vector types to be legal");
1923+
SDValue L = DAG.getLoad(NewVT, DL, Load->getChain(), Load->getBasePtr(),
1924+
Load->getPointerInfo(), Load->getOriginalAlign(),
1925+
Load->getMemOperand()->getFlags());
1926+
return DAG.getMergeValues({DAG.getBitcast(VT, L), L.getValue(1)}, DL);
1927+
}
1928+
1929+
// While RVV has alignment restrictions, we should always be able to store as a
1930+
// legal equivalently-sized byte-typed vector instead. This method is
1931+
// responsible for re-expressing a ISD::STORE via a correctly-aligned type. It
1932+
// returns SDValue() if the store is already correctly aligned.
1933+
SDValue RISCVTargetLowering::expandUnalignedRVVStore(SDValue Op,
1934+
SelectionDAG &DAG) const {
1935+
auto *Store = cast<StoreSDNode>(Op);
1936+
assert(Store && Store->getValue().getValueType().isVector() &&
1937+
"Expected vector store");
1938+
1939+
if (allowsMemoryAccessForAlignment(*DAG.getContext(), DAG.getDataLayout(),
1940+
Store->getMemoryVT(),
1941+
*Store->getMemOperand()))
1942+
return SDValue();
1943+
1944+
SDLoc DL(Op);
1945+
SDValue StoredVal = Store->getValue();
1946+
MVT VT = StoredVal.getSimpleValueType();
1947+
unsigned EltSizeBits = VT.getScalarSizeInBits();
1948+
assert((EltSizeBits == 16 || EltSizeBits == 32 || EltSizeBits == 64) &&
1949+
"Unexpected unaligned RVV store type");
1950+
MVT NewVT =
1951+
MVT::getVectorVT(MVT::i8, VT.getVectorElementCount() * (EltSizeBits / 8));
1952+
assert(NewVT.isValid() &&
1953+
"Expecting equally-sized RVV vector types to be legal");
1954+
StoredVal = DAG.getBitcast(NewVT, StoredVal);
1955+
return DAG.getStore(Store->getChain(), DL, StoredVal, Store->getBasePtr(),
1956+
Store->getPointerInfo(), Store->getOriginalAlign(),
1957+
Store->getMemOperand()->getFlags());
1958+
}
1959+
18941960
SDValue RISCVTargetLowering::LowerOperation(SDValue Op,
18951961
SelectionDAG &DAG) const {
18961962
switch (Op.getOpcode()) {
@@ -2310,9 +2376,17 @@ SDValue RISCVTargetLowering::LowerOperation(SDValue Op,
23102376
return Vec;
23112377
}
23122378
case ISD::LOAD:
2313-
return lowerFixedLengthVectorLoadToRVV(Op, DAG);
2379+
if (auto V = expandUnalignedRVVLoad(Op, DAG))
2380+
return V;
2381+
if (Op.getValueType().isFixedLengthVector())
2382+
return lowerFixedLengthVectorLoadToRVV(Op, DAG);
2383+
return Op;
23142384
case ISD::STORE:
2315-
return lowerFixedLengthVectorStoreToRVV(Op, DAG);
2385+
if (auto V = expandUnalignedRVVStore(Op, DAG))
2386+
return V;
2387+
if (Op.getOperand(1).getValueType().isFixedLengthVector())
2388+
return lowerFixedLengthVectorStoreToRVV(Op, DAG);
2389+
return Op;
23162390
case ISD::MLOAD:
23172391
return lowerMLOAD(Op, DAG);
23182392
case ISD::MSTORE:
@@ -4031,13 +4105,10 @@ RISCVTargetLowering::lowerFixedLengthVectorLoadToRVV(SDValue Op,
40314105
SDLoc DL(Op);
40324106
auto *Load = cast<LoadSDNode>(Op);
40334107

4034-
if (!allowsMemoryAccessForAlignment(*DAG.getContext(), DAG.getDataLayout(),
4035-
Load->getMemoryVT(),
4036-
*Load->getMemOperand())) {
4037-
SDValue Result, Chain;
4038-
std::tie(Result, Chain) = expandUnalignedLoad(Load, DAG);
4039-
return DAG.getMergeValues({Result, Chain}, DL);
4040-
}
4108+
assert(allowsMemoryAccessForAlignment(*DAG.getContext(), DAG.getDataLayout(),
4109+
Load->getMemoryVT(),
4110+
*Load->getMemOperand()) &&
4111+
"Expecting a correctly-aligned load");
40414112

40424113
MVT VT = Op.getSimpleValueType();
40434114
MVT ContainerVT = getContainerForFixedLengthVector(VT);
@@ -4060,10 +4131,10 @@ RISCVTargetLowering::lowerFixedLengthVectorStoreToRVV(SDValue Op,
40604131
SDLoc DL(Op);
40614132
auto *Store = cast<StoreSDNode>(Op);
40624133

4063-
if (!allowsMemoryAccessForAlignment(*DAG.getContext(), DAG.getDataLayout(),
4064-
Store->getMemoryVT(),
4065-
*Store->getMemOperand()))
4066-
return expandUnalignedStore(Store, DAG);
4134+
assert(allowsMemoryAccessForAlignment(*DAG.getContext(), DAG.getDataLayout(),
4135+
Store->getMemoryVT(),
4136+
*Store->getMemOperand()) &&
4137+
"Expecting a correctly-aligned store");
40674138

40684139
SDValue StoreVal = Store->getValue();
40694140
MVT VT = StoreVal.getSimpleValueType();

llvm/lib/Target/RISCV/RISCVISelLowering.h

+3
Original file line numberDiff line numberDiff line change
@@ -562,6 +562,9 @@ class RISCVTargetLowering : public TargetLowering {
562562
SDValue lowerGET_ROUNDING(SDValue Op, SelectionDAG &DAG) const;
563563
SDValue lowerSET_ROUNDING(SDValue Op, SelectionDAG &DAG) const;
564564

565+
SDValue expandUnalignedRVVLoad(SDValue Op, SelectionDAG &DAG) const;
566+
SDValue expandUnalignedRVVStore(SDValue Op, SelectionDAG &DAG) const;
567+
565568
bool isEligibleForTailCallOptimization(
566569
CCState &CCInfo, CallLoweringInfo &CLI, MachineFunction &MF,
567570
const SmallVector<CCValAssign, 16> &ArgLocs) const;

0 commit comments

Comments
 (0)