@@ -3525,7 +3525,7 @@ convertMLOADToLoadWithUsedBytesMask(MemSDNode *N, SelectionDAG &DAG) {
35253525 uint32_t ElementSizeInBytes = ElementSizeInBits / 8 ;
35263526 uint32_t ElementMask = (1u << ElementSizeInBytes) - 1u ;
35273527
3528- for (SDValue Op : llvm:: reverse (Mask->ops ())) {
3528+ for (SDValue Op : reverse (Mask->ops ())) {
35293529 // We technically only want to do this shift for every
35303530 // iteration *but* the first, but in the first iteration NewMask is 0, so
35313531 // this shift is a no-op.
@@ -3714,8 +3714,7 @@ SDValue NVPTXTargetLowering::LowerMLOAD(SDValue Op, SelectionDAG &DAG) const {
37143714 // will validate alignment. Therefore, we do not need to special case handle
37153715 // them here.
37163716 EVT VT = Op.getValueType ();
3717- if (NVPTX::isPackedVectorTy (VT) &&
3718- (VT != MVT::v2f32 || STI.hasF32x2Instructions ())) {
3717+ if (NVPTX::isPackedVectorTy (VT)) {
37193718 auto Result =
37203719 convertMLOADToLoadWithUsedBytesMask (cast<MemSDNode>(Op.getNode ()), DAG);
37213720 MemSDNode *LD = std::get<0 >(Result);
@@ -5656,7 +5655,6 @@ combineUnpackingMovIntoLoad(SDNode *N, TargetLowering::DAGCombinerInfo &DCI) {
56565655 Operands.push_back (DCI.DAG .getIntPtrConstant (
56575656 cast<LoadSDNode>(LD)->getExtensionType (), DL));
56585657 break ;
5659- // TODO do we need to support MLoadV1 here?
56605658 case NVPTXISD::LoadV2:
56615659 OldNumOutputs = 2 ;
56625660 Opcode = NVPTXISD::LoadV4;
0 commit comments