@@ -4625,6 +4625,9 @@ void DAGTypeLegalizer::WidenVectorResult(SDNode *N, unsigned ResNo) {
46254625 break ;
46264626 case ISD::EXTRACT_SUBVECTOR: Res = WidenVecRes_EXTRACT_SUBVECTOR (N); break ;
46274627 case ISD::INSERT_VECTOR_ELT: Res = WidenVecRes_INSERT_VECTOR_ELT (N); break ;
4628+ case ISD::ATOMIC_LOAD:
4629+ Res = WidenVecRes_ATOMIC_LOAD (cast<AtomicSDNode>(N));
4630+ break ;
46284631 case ISD::LOAD: Res = WidenVecRes_LOAD (N); break ;
46294632 case ISD::STEP_VECTOR:
46304633 case ISD::SPLAT_VECTOR:
@@ -6014,6 +6017,74 @@ SDValue DAGTypeLegalizer::WidenVecRes_INSERT_VECTOR_ELT(SDNode *N) {
60146017 N->getOperand (1 ), N->getOperand (2 ));
60156018}
60166019
6020+ // / Either return the same load or provide appropriate casts
6021+ // / from the load and return that.
6022+ static SDValue coerceLoadedValue (SDValue LdOp, EVT FirstVT, EVT WidenVT,
6023+ TypeSize LdWidth, TypeSize FirstVTWidth,
6024+ SDLoc dl, SelectionDAG &DAG) {
6025+ assert (TypeSize::isKnownLE (LdWidth, FirstVTWidth));
6026+ TypeSize WidenWidth = WidenVT.getSizeInBits ();
6027+ if (!FirstVT.isVector ()) {
6028+ unsigned NumElts =
6029+ WidenWidth.getFixedValue () / FirstVTWidth.getFixedValue ();
6030+ EVT NewVecVT = EVT::getVectorVT (*DAG.getContext (), FirstVT, NumElts);
6031+ SDValue VecOp = DAG.getNode (ISD::SCALAR_TO_VECTOR, dl, NewVecVT, LdOp);
6032+ return DAG.getNode (ISD::BITCAST, dl, WidenVT, VecOp);
6033+ }
6034+ assert (FirstVT == WidenVT);
6035+ return LdOp;
6036+ }
6037+
6038+ static std::optional<EVT> findMemType (SelectionDAG &DAG,
6039+ const TargetLowering &TLI, unsigned Width,
6040+ EVT WidenVT, unsigned Align,
6041+ unsigned WidenEx);
6042+
6043+ SDValue DAGTypeLegalizer::WidenVecRes_ATOMIC_LOAD (AtomicSDNode *LD) {
6044+ EVT WidenVT =
6045+ TLI.getTypeToTransformTo (*DAG.getContext (), LD->getValueType (0 ));
6046+ EVT LdVT = LD->getMemoryVT ();
6047+ SDLoc dl (LD);
6048+ assert (LdVT.isVector () && WidenVT.isVector () && " Expected vectors" );
6049+ assert (LdVT.isScalableVector () == WidenVT.isScalableVector () &&
6050+ " Must be scalable" );
6051+ assert (LdVT.getVectorElementType () == WidenVT.getVectorElementType () &&
6052+ " Expected equivalent element types" );
6053+
6054+ // Load information
6055+ SDValue Chain = LD->getChain ();
6056+ SDValue BasePtr = LD->getBasePtr ();
6057+ MachineMemOperand::Flags MMOFlags = LD->getMemOperand ()->getFlags ();
6058+ AAMDNodes AAInfo = LD->getAAInfo ();
6059+
6060+ TypeSize LdWidth = LdVT.getSizeInBits ();
6061+ TypeSize WidenWidth = WidenVT.getSizeInBits ();
6062+ TypeSize WidthDiff = WidenWidth - LdWidth;
6063+
6064+ // Find the vector type that can load from.
6065+ std::optional<EVT> FirstVT =
6066+ findMemType (DAG, TLI, LdWidth.getKnownMinValue (), WidenVT, /* LdAlign=*/ 0 ,
6067+ WidthDiff.getKnownMinValue ());
6068+
6069+ if (!FirstVT)
6070+ return SDValue ();
6071+
6072+ SmallVector<EVT, 8 > MemVTs;
6073+ TypeSize FirstVTWidth = FirstVT->getSizeInBits ();
6074+
6075+ SDValue LdOp = DAG.getAtomicLoad (ISD::NON_EXTLOAD, dl, *FirstVT, *FirstVT,
6076+ Chain, BasePtr, LD->getMemOperand ());
6077+
6078+ // Load the element with one instruction.
6079+ SDValue Result = coerceLoadedValue (LdOp, *FirstVT, WidenVT, LdWidth,
6080+ FirstVTWidth, dl, DAG);
6081+
6082+ // Modified the chain - switch anything that used the old chain to use
6083+ // the new one.
6084+ ReplaceValueWith (SDValue (LD, 1 ), LdOp.getValue (1 ));
6085+ return Result;
6086+ }
6087+
60176088SDValue DAGTypeLegalizer::WidenVecRes_LOAD (SDNode *N) {
60186089 LoadSDNode *LD = cast<LoadSDNode>(N);
60196090 ISD::LoadExtType ExtType = LD->getExtensionType ();
@@ -7896,29 +7967,9 @@ SDValue DAGTypeLegalizer::GenWidenVectorLoads(SmallVectorImpl<SDValue> &LdChain,
78967967 LdChain.push_back (LdOp.getValue (1 ));
78977968
78987969 // Check if we can load the element with one instruction.
7899- if (MemVTs.empty ()) {
7900- assert (TypeSize::isKnownLE (LdWidth, FirstVTWidth));
7901- if (!FirstVT->isVector ()) {
7902- unsigned NumElts =
7903- WidenWidth.getFixedValue () / FirstVTWidth.getFixedValue ();
7904- EVT NewVecVT = EVT::getVectorVT (*DAG.getContext (), *FirstVT, NumElts);
7905- SDValue VecOp = DAG.getNode (ISD::SCALAR_TO_VECTOR, dl, NewVecVT, LdOp);
7906- return DAG.getNode (ISD::BITCAST, dl, WidenVT, VecOp);
7907- }
7908- if (FirstVT == WidenVT)
7909- return LdOp;
7910-
7911- // TODO: We don't currently have any tests that exercise this code path.
7912- assert (WidenWidth.getFixedValue () % FirstVTWidth.getFixedValue () == 0 );
7913- unsigned NumConcat =
7914- WidenWidth.getFixedValue () / FirstVTWidth.getFixedValue ();
7915- SmallVector<SDValue, 16 > ConcatOps (NumConcat);
7916- SDValue UndefVal = DAG.getUNDEF (*FirstVT);
7917- ConcatOps[0 ] = LdOp;
7918- for (unsigned i = 1 ; i != NumConcat; ++i)
7919- ConcatOps[i] = UndefVal;
7920- return DAG.getNode (ISD::CONCAT_VECTORS, dl, WidenVT, ConcatOps);
7921- }
7970+ if (MemVTs.empty ())
7971+ return coerceLoadedValue (LdOp, *FirstVT, WidenVT, LdWidth, FirstVTWidth, dl,
7972+ DAG);
79227973
79237974 // Load vector by using multiple loads from largest vector to scalar.
79247975 SmallVector<SDValue, 16 > LdOps;
0 commit comments