@@ -4625,6 +4625,9 @@ void DAGTypeLegalizer::WidenVectorResult(SDNode *N, unsigned ResNo) {
4625
4625
break ;
4626
4626
case ISD::EXTRACT_SUBVECTOR: Res = WidenVecRes_EXTRACT_SUBVECTOR (N); break ;
4627
4627
case ISD::INSERT_VECTOR_ELT: Res = WidenVecRes_INSERT_VECTOR_ELT (N); break ;
4628
+ case ISD::ATOMIC_LOAD:
4629
+ Res = WidenVecRes_ATOMIC_LOAD (cast<AtomicSDNode>(N));
4630
+ break ;
4628
4631
case ISD::LOAD: Res = WidenVecRes_LOAD (N); break ;
4629
4632
case ISD::STEP_VECTOR:
4630
4633
case ISD::SPLAT_VECTOR:
@@ -6014,6 +6017,74 @@ SDValue DAGTypeLegalizer::WidenVecRes_INSERT_VECTOR_ELT(SDNode *N) {
6014
6017
N->getOperand (1 ), N->getOperand (2 ));
6015
6018
}
6016
6019
6020
+ // / Either return the same load or provide appropriate casts
6021
+ // / from the load and return that.
6022
+ static SDValue coerceLoadedValue (SDValue LdOp, EVT FirstVT, EVT WidenVT,
6023
+ TypeSize LdWidth, TypeSize FirstVTWidth,
6024
+ SDLoc dl, SelectionDAG &DAG) {
6025
+ assert (TypeSize::isKnownLE (LdWidth, FirstVTWidth));
6026
+ TypeSize WidenWidth = WidenVT.getSizeInBits ();
6027
+ if (!FirstVT.isVector ()) {
6028
+ unsigned NumElts =
6029
+ WidenWidth.getFixedValue () / FirstVTWidth.getFixedValue ();
6030
+ EVT NewVecVT = EVT::getVectorVT (*DAG.getContext (), FirstVT, NumElts);
6031
+ SDValue VecOp = DAG.getNode (ISD::SCALAR_TO_VECTOR, dl, NewVecVT, LdOp);
6032
+ return DAG.getNode (ISD::BITCAST, dl, WidenVT, VecOp);
6033
+ }
6034
+ assert (FirstVT == WidenVT);
6035
+ return LdOp;
6036
+ }
6037
+
6038
+ static std::optional<EVT> findMemType (SelectionDAG &DAG,
6039
+ const TargetLowering &TLI, unsigned Width,
6040
+ EVT WidenVT, unsigned Align,
6041
+ unsigned WidenEx);
6042
+
6043
+ SDValue DAGTypeLegalizer::WidenVecRes_ATOMIC_LOAD (AtomicSDNode *LD) {
6044
+ EVT WidenVT =
6045
+ TLI.getTypeToTransformTo (*DAG.getContext (), LD->getValueType (0 ));
6046
+ EVT LdVT = LD->getMemoryVT ();
6047
+ SDLoc dl (LD);
6048
+ assert (LdVT.isVector () && WidenVT.isVector () && " Expected vectors" );
6049
+ assert (LdVT.isScalableVector () == WidenVT.isScalableVector () &&
6050
+ " Must be scalable" );
6051
+ assert (LdVT.getVectorElementType () == WidenVT.getVectorElementType () &&
6052
+ " Expected equivalent element types" );
6053
+
6054
+ // Load information
6055
+ SDValue Chain = LD->getChain ();
6056
+ SDValue BasePtr = LD->getBasePtr ();
6057
+ MachineMemOperand::Flags MMOFlags = LD->getMemOperand ()->getFlags ();
6058
+ AAMDNodes AAInfo = LD->getAAInfo ();
6059
+
6060
+ TypeSize LdWidth = LdVT.getSizeInBits ();
6061
+ TypeSize WidenWidth = WidenVT.getSizeInBits ();
6062
+ TypeSize WidthDiff = WidenWidth - LdWidth;
6063
+
6064
+ // Find the vector type that can load from.
6065
+ std::optional<EVT> FirstVT =
6066
+ findMemType (DAG, TLI, LdWidth.getKnownMinValue (), WidenVT, /* LdAlign=*/ 0 ,
6067
+ WidthDiff.getKnownMinValue ());
6068
+
6069
+ if (!FirstVT)
6070
+ return SDValue ();
6071
+
6072
+ SmallVector<EVT, 8 > MemVTs;
6073
+ TypeSize FirstVTWidth = FirstVT->getSizeInBits ();
6074
+
6075
+ SDValue LdOp = DAG.getAtomicLoad (ISD::NON_EXTLOAD, dl, *FirstVT, *FirstVT,
6076
+ Chain, BasePtr, LD->getMemOperand ());
6077
+
6078
+ // Load the element with one instruction.
6079
+ SDValue Result = coerceLoadedValue (LdOp, *FirstVT, WidenVT, LdWidth,
6080
+ FirstVTWidth, dl, DAG);
6081
+
6082
+ // Modified the chain - switch anything that used the old chain to use
6083
+ // the new one.
6084
+ ReplaceValueWith (SDValue (LD, 1 ), LdOp.getValue (1 ));
6085
+ return Result;
6086
+ }
6087
+
6017
6088
SDValue DAGTypeLegalizer::WidenVecRes_LOAD (SDNode *N) {
6018
6089
LoadSDNode *LD = cast<LoadSDNode>(N);
6019
6090
ISD::LoadExtType ExtType = LD->getExtensionType ();
@@ -7896,29 +7967,9 @@ SDValue DAGTypeLegalizer::GenWidenVectorLoads(SmallVectorImpl<SDValue> &LdChain,
7896
7967
LdChain.push_back (LdOp.getValue (1 ));
7897
7968
7898
7969
// Check if we can load the element with one instruction.
7899
- if (MemVTs.empty ()) {
7900
- assert (TypeSize::isKnownLE (LdWidth, FirstVTWidth));
7901
- if (!FirstVT->isVector ()) {
7902
- unsigned NumElts =
7903
- WidenWidth.getFixedValue () / FirstVTWidth.getFixedValue ();
7904
- EVT NewVecVT = EVT::getVectorVT (*DAG.getContext (), *FirstVT, NumElts);
7905
- SDValue VecOp = DAG.getNode (ISD::SCALAR_TO_VECTOR, dl, NewVecVT, LdOp);
7906
- return DAG.getNode (ISD::BITCAST, dl, WidenVT, VecOp);
7907
- }
7908
- if (FirstVT == WidenVT)
7909
- return LdOp;
7910
-
7911
- // TODO: We don't currently have any tests that exercise this code path.
7912
- assert (WidenWidth.getFixedValue () % FirstVTWidth.getFixedValue () == 0 );
7913
- unsigned NumConcat =
7914
- WidenWidth.getFixedValue () / FirstVTWidth.getFixedValue ();
7915
- SmallVector<SDValue, 16 > ConcatOps (NumConcat);
7916
- SDValue UndefVal = DAG.getUNDEF (*FirstVT);
7917
- ConcatOps[0 ] = LdOp;
7918
- for (unsigned i = 1 ; i != NumConcat; ++i)
7919
- ConcatOps[i] = UndefVal;
7920
- return DAG.getNode (ISD::CONCAT_VECTORS, dl, WidenVT, ConcatOps);
7921
- }
7970
+ if (MemVTs.empty ())
7971
+ return coerceLoadedValue (LdOp, *FirstVT, WidenVT, LdWidth, FirstVTWidth, dl,
7972
+ DAG);
7922
7973
7923
7974
// Load vector by using multiple loads from largest vector to scalar.
7924
7975
SmallVector<SDValue, 16 > LdOps;
0 commit comments