- 
                Notifications
    You must be signed in to change notification settings 
- Fork 15k
Revert "[WebAssembly] Lower fmuladd to madd and nmadd" #163171
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
          
     Merged
      
        
      
    
                
     Merged
            
            
          Conversation
  
    
      This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
      Learn more about bidirectional Unicode characters
    
  
  
    
    This reverts commit a4eb7ea.
| @llvm/pr-subscribers-llvm-selectiondag @llvm/pr-subscribers-backend-webassembly Author: Sam Parker (sparker-arm) ChangesReverts llvm/llvm-project#161355 Looks like I've broken some intrinsic code generation. Patch is 85.26 KiB, truncated to 20.00 KiB below, full version: https://github.com/llvm/llvm-project/pull/163171.diff 14 Files Affected: 
 diff --git a/llvm/include/llvm/CodeGen/ISDOpcodes.h b/llvm/include/llvm/CodeGen/ISDOpcodes.h
index ff3dd0d4c3c51..c76c83d84b3c7 100644
--- a/llvm/include/llvm/CodeGen/ISDOpcodes.h
+++ b/llvm/include/llvm/CodeGen/ISDOpcodes.h
@@ -514,12 +514,6 @@ enum NodeType {
   /// separately rounded operations.
   FMAD,
 
-  /// FMULADD - Performs a * b + c, with, or without, intermediate rounding.
-  /// It is expected that this will be illegal for most targets, as it usually
-  /// makes sense to split this or use an FMA. But some targets, such as
-  /// WebAssembly, can directly support these semantics.
-  FMULADD,
-
   /// FCOPYSIGN(X, Y) - Return the value of X with the sign of Y.  NOTE: This
   /// DAG node does not require that X and Y have the same type, just that
   /// they are both floating point.  X and the result must have the same type.
diff --git a/llvm/include/llvm/Target/TargetSelectionDAG.td b/llvm/include/llvm/Target/TargetSelectionDAG.td
index 07a858fd682fc..632be7ad9e350 100644
--- a/llvm/include/llvm/Target/TargetSelectionDAG.td
+++ b/llvm/include/llvm/Target/TargetSelectionDAG.td
@@ -535,7 +535,6 @@ def fdiv       : SDNode<"ISD::FDIV"       , SDTFPBinOp>;
 def frem       : SDNode<"ISD::FREM"       , SDTFPBinOp>;
 def fma        : SDNode<"ISD::FMA"        , SDTFPTernaryOp, [SDNPCommutative]>;
 def fmad       : SDNode<"ISD::FMAD"       , SDTFPTernaryOp, [SDNPCommutative]>;
-def fmuladd    : SDNode<"ISD::FMULADD"    , SDTFPTernaryOp, [SDNPCommutative]>;
 def fabs       : SDNode<"ISD::FABS"       , SDTFPUnaryOp>;
 def fminnum    : SDNode<"ISD::FMINNUM"    , SDTFPBinOp,
                                   [SDNPCommutative, SDNPAssociative]>;
diff --git a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
index e15384202f758..b1accdd066dfd 100644
--- a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
@@ -509,7 +509,6 @@ namespace {
     SDValue visitFMUL(SDNode *N);
     template <class MatchContextClass> SDValue visitFMA(SDNode *N);
     SDValue visitFMAD(SDNode *N);
-    SDValue visitFMULADD(SDNode *N);
     SDValue visitFDIV(SDNode *N);
     SDValue visitFREM(SDNode *N);
     SDValue visitFSQRT(SDNode *N);
@@ -1992,7 +1991,6 @@ SDValue DAGCombiner::visit(SDNode *N) {
   case ISD::FMUL:               return visitFMUL(N);
   case ISD::FMA:                return visitFMA<EmptyMatchContext>(N);
   case ISD::FMAD:               return visitFMAD(N);
-  case ISD::FMULADD:            return visitFMULADD(N);
   case ISD::FDIV:               return visitFDIV(N);
   case ISD::FREM:               return visitFREM(N);
   case ISD::FSQRT:              return visitFSQRT(N);
@@ -18446,21 +18444,6 @@ SDValue DAGCombiner::visitFMAD(SDNode *N) {
   return SDValue();
 }
 
-SDValue DAGCombiner::visitFMULADD(SDNode *N) {
-  SDValue N0 = N->getOperand(0);
-  SDValue N1 = N->getOperand(1);
-  SDValue N2 = N->getOperand(2);
-  EVT VT = N->getValueType(0);
-  SDLoc DL(N);
-
-  // Constant fold FMULADD.
-  if (SDValue C =
-          DAG.FoldConstantArithmetic(ISD::FMULADD, DL, VT, {N0, N1, N2}))
-    return C;
-
-  return SDValue();
-}
-
 // Combine multiple FDIVs with the same divisor into multiple FMULs by the
 // reciprocal.
 // E.g., (a / D; b / D;) -> (recip = 1.0 / D; a * recip; b * recip)
diff --git a/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp b/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
index c1fd052d01f31..08af74c258899 100644
--- a/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
@@ -5786,7 +5786,6 @@ bool SelectionDAG::canCreateUndefOrPoison(SDValue Op, const APInt &DemandedElts,
   case ISD::FCOPYSIGN:
   case ISD::FMA:
   case ISD::FMAD:
-  case ISD::FMULADD:
   case ISD::FP_EXTEND:
   case ISD::FP_TO_SINT_SAT:
   case ISD::FP_TO_UINT_SAT:
@@ -5905,7 +5904,6 @@ bool SelectionDAG::isKnownNeverNaN(SDValue Op, const APInt &DemandedElts,
   case ISD::FCOSH:
   case ISD::FTANH:
   case ISD::FMA:
-  case ISD::FMULADD:
   case ISD::FMAD: {
     if (SNaN)
       return true;
@@ -7233,7 +7231,7 @@ SDValue SelectionDAG::FoldConstantArithmetic(unsigned Opcode, const SDLoc &DL,
   }
 
   // Handle fma/fmad special cases.
-  if (Opcode == ISD::FMA || Opcode == ISD::FMAD || Opcode == ISD::FMULADD) {
+  if (Opcode == ISD::FMA || Opcode == ISD::FMAD) {
     assert(VT.isFloatingPoint() && "This operator only applies to FP types!");
     assert(Ops[0].getValueType() == VT && Ops[1].getValueType() == VT &&
            Ops[2].getValueType() == VT && "FMA types must match!");
@@ -7244,7 +7242,7 @@ SDValue SelectionDAG::FoldConstantArithmetic(unsigned Opcode, const SDLoc &DL,
       APFloat V1 = C1->getValueAPF();
       const APFloat &V2 = C2->getValueAPF();
       const APFloat &V3 = C3->getValueAPF();
-      if (Opcode == ISD::FMAD || Opcode == ISD::FMULADD) {
+      if (Opcode == ISD::FMAD) {
         V1.multiply(V2, APFloat::rmNearestTiesToEven);
         V1.add(V3, APFloat::rmNearestTiesToEven);
       } else
diff --git a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
index 0f2b5188fc10a..c21890a0d856f 100644
--- a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
@@ -6996,13 +6996,6 @@ void SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I,
                                getValue(I.getArgOperand(0)),
                                getValue(I.getArgOperand(1)),
                                getValue(I.getArgOperand(2)), Flags));
-    } else if (TLI.isOperationLegalOrCustom(ISD::FMULADD, VT)) {
-      // TODO: Support splitting the vector.
-      setValue(&I, DAG.getNode(ISD::FMULADD, sdl,
-                               getValue(I.getArgOperand(0)).getValueType(),
-                               getValue(I.getArgOperand(0)),
-                               getValue(I.getArgOperand(1)),
-                               getValue(I.getArgOperand(2)), Flags));
     } else {
       // TODO: Intrinsic calls should have fast-math-flags.
       SDValue Mul = DAG.getNode(
diff --git a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp
index 39cbfad6d0be1..fcfbfe6c461d3 100644
--- a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp
@@ -310,7 +310,6 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
   case ISD::FMA:                        return "fma";
   case ISD::STRICT_FMA:                 return "strict_fma";
   case ISD::FMAD:                       return "fmad";
-  case ISD::FMULADD:                    return "fmuladd";
   case ISD::FREM:                       return "frem";
   case ISD::STRICT_FREM:                return "strict_frem";
   case ISD::FCOPYSIGN:                  return "fcopysign";
diff --git a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp
index 920dff935daed..cc503d324e74b 100644
--- a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp
@@ -7676,7 +7676,6 @@ SDValue TargetLowering::getNegatedExpression(SDValue Op, SelectionDAG &DAG,
     break;
   }
   case ISD::FMA:
-  case ISD::FMULADD:
   case ISD::FMAD: {
     if (!Flags.hasNoSignedZeros())
       break;
diff --git a/llvm/lib/CodeGen/TargetLoweringBase.cpp b/llvm/lib/CodeGen/TargetLoweringBase.cpp
index 060b1ddc2ef39..c23281a820b2b 100644
--- a/llvm/lib/CodeGen/TargetLoweringBase.cpp
+++ b/llvm/lib/CodeGen/TargetLoweringBase.cpp
@@ -815,8 +815,7 @@ void TargetLoweringBase::initActions() {
                         ISD::FTAN,           ISD::FACOS,
                         ISD::FASIN,          ISD::FATAN,
                         ISD::FCOSH,          ISD::FSINH,
-                        ISD::FTANH,          ISD::FATAN2,
-                        ISD::FMULADD},
+                        ISD::FTANH,          ISD::FATAN2},
                        VT, Expand);
 
     // Overflow operations default to expand
diff --git a/llvm/lib/Target/WebAssembly/WebAssemblyISelLowering.cpp b/llvm/lib/Target/WebAssembly/WebAssemblyISelLowering.cpp
index 47c24fc27f1d6..64723340051b8 100644
--- a/llvm/lib/Target/WebAssembly/WebAssemblyISelLowering.cpp
+++ b/llvm/lib/Target/WebAssembly/WebAssemblyISelLowering.cpp
@@ -317,15 +317,6 @@ WebAssemblyTargetLowering::WebAssemblyTargetLowering(
       setOperationAction(ISD::ZERO_EXTEND_VECTOR_INREG, T, Custom);
     }
 
-    if (Subtarget->hasFP16()) {
-      setOperationAction(ISD::FMA, MVT::v8f16, Legal);
-    }
-
-    if (Subtarget->hasRelaxedSIMD()) {
-      setOperationAction(ISD::FMULADD, MVT::v4f32, Legal);
-      setOperationAction(ISD::FMULADD, MVT::v2f64, Legal);
-    }
-
     // Partial MLA reductions.
     for (auto Op : {ISD::PARTIAL_REDUCE_SMLA, ISD::PARTIAL_REDUCE_UMLA}) {
       setPartialReduceMLAAction(Op, MVT::v4i32, MVT::v16i8, Legal);
@@ -1129,18 +1120,6 @@ WebAssemblyTargetLowering::getPreferredVectorAction(MVT VT) const {
   return TargetLoweringBase::getPreferredVectorAction(VT);
 }
 
-bool WebAssemblyTargetLowering::isFMAFasterThanFMulAndFAdd(
-    const MachineFunction &MF, EVT VT) const {
-  if (!Subtarget->hasFP16() || !VT.isVector())
-    return false;
-
-  EVT ScalarVT = VT.getScalarType();
-  if (!ScalarVT.isSimple())
-    return false;
-
-  return ScalarVT.getSimpleVT().SimpleTy == MVT::f16;
-}
-
 bool WebAssemblyTargetLowering::shouldSimplifyDemandedVectorElts(
     SDValue Op, const TargetLoweringOpt &TLO) const {
   // ISel process runs DAGCombiner after legalization; this step is called
diff --git a/llvm/lib/Target/WebAssembly/WebAssemblyISelLowering.h b/llvm/lib/Target/WebAssembly/WebAssemblyISelLowering.h
index 472ec678534a4..b33a8530310be 100644
--- a/llvm/lib/Target/WebAssembly/WebAssemblyISelLowering.h
+++ b/llvm/lib/Target/WebAssembly/WebAssemblyISelLowering.h
@@ -81,8 +81,6 @@ class WebAssemblyTargetLowering final : public TargetLowering {
 
   TargetLoweringBase::LegalizeTypeAction
   getPreferredVectorAction(MVT VT) const override;
-  bool isFMAFasterThanFMulAndFAdd(const MachineFunction &MF,
-                                  EVT VT) const override;
 
   SDValue LowerCall(CallLoweringInfo &CLI,
                     SmallVectorImpl<SDValue> &InVals) const override;
diff --git a/llvm/lib/Target/WebAssembly/WebAssemblyInstrSIMD.td b/llvm/lib/Target/WebAssembly/WebAssemblyInstrSIMD.td
index 72835b3c6424e..49af78bce68c3 100644
--- a/llvm/lib/Target/WebAssembly/WebAssemblyInstrSIMD.td
+++ b/llvm/lib/Target/WebAssembly/WebAssemblyInstrSIMD.td
@@ -1626,8 +1626,7 @@ defm "" : RelaxedConvert<I32x4, F64x2, int_wasm_relaxed_trunc_unsigned_zero,
 // Relaxed (Negative) Multiply-Add  (madd/nmadd)
 //===----------------------------------------------------------------------===//
 
-multiclass RELAXED_SIMDMADD<Vec vec, bits<32> simdopA, bits<32> simdopS,
-                            list<Predicate> reqs> {
+multiclass SIMDMADD<Vec vec, bits<32> simdopA, bits<32> simdopS, list<Predicate> reqs> {
   defm MADD_#vec :
     SIMD_I<(outs V128:$dst), (ins V128:$a, V128:$b, V128:$c), (outs), (ins),
            [(set (vec.vt V128:$dst), (int_wasm_relaxed_madd
@@ -1641,40 +1640,16 @@ multiclass RELAXED_SIMDMADD<Vec vec, bits<32> simdopA, bits<32> simdopS,
            vec.prefix#".relaxed_nmadd\t$dst, $a, $b, $c",
            vec.prefix#".relaxed_nmadd", simdopS, reqs>;
 
-  def : Pat<(fadd_contract (fmul_contract (vec.vt V128:$a), (vec.vt V128:$b)), (vec.vt V128:$c)),
-            (!cast<Instruction>("MADD_"#vec) V128:$a, V128:$b, V128:$c)>, Requires<reqs>;
-  def : Pat<(fmuladd (vec.vt V128:$a), (vec.vt V128:$b), (vec.vt V128:$c)),
-             (!cast<Instruction>("MADD_"#vec) V128:$a, V128:$b, V128:$c)>, Requires<reqs>;
+  def : Pat<(fadd_contract (vec.vt V128:$a), (fmul_contract (vec.vt V128:$b), (vec.vt V128:$c))),
+             (!cast<Instruction>("MADD_"#vec) V128:$a, V128:$b, V128:$c)>, Requires<[HasRelaxedSIMD]>;
 
-  def : Pat<(fsub_contract (vec.vt V128:$c), (fmul_contract (vec.vt V128:$a), (vec.vt V128:$b))),
-            (!cast<Instruction>("NMADD_"#vec) V128:$a, V128:$b, V128:$c)>, Requires<reqs>;
-  def : Pat<(fmuladd (fneg (vec.vt V128:$a)), (vec.vt V128:$b), (vec.vt V128:$c)),
-             (!cast<Instruction>("NMADD_"#vec) V128:$a, V128:$b, V128:$c)>, Requires<reqs>;
+  def : Pat<(fsub_contract (vec.vt V128:$a), (fmul_contract (vec.vt V128:$b), (vec.vt V128:$c))),
+             (!cast<Instruction>("NMADD_"#vec) V128:$a, V128:$b, V128:$c)>, Requires<[HasRelaxedSIMD]>;
 }
 
-defm "" : RELAXED_SIMDMADD<F32x4, 0x105, 0x106, [HasRelaxedSIMD]>;
-defm "" : RELAXED_SIMDMADD<F64x2, 0x107, 0x108, [HasRelaxedSIMD]>;
-
-//===----------------------------------------------------------------------===//
-// FP16 (Negative) Multiply-Add  (madd/nmadd)
-//===----------------------------------------------------------------------===//
-
-multiclass HALF_PRECISION_SIMDMADD<Vec vec, bits<32> simdopA, bits<32> simdopS,
-                                   list<Predicate> reqs> {
-  defm MADD_#vec :
-    SIMD_I<(outs V128:$dst), (ins V128:$a, V128:$b, V128:$c), (outs), (ins),
-           [(set (vec.vt V128:$dst), (fma
-             (vec.vt V128:$a), (vec.vt V128:$b), (vec.vt V128:$c)))],
-           vec.prefix#".madd\t$dst, $a, $b, $c",
-           vec.prefix#".madd", simdopA, reqs>;
-  defm NMADD_#vec :
-    SIMD_I<(outs V128:$dst), (ins V128:$a, V128:$b, V128:$c), (outs), (ins),
-           [(set (vec.vt V128:$dst), (fma
-             (fneg (vec.vt V128:$a)), (vec.vt V128:$b), (vec.vt V128:$c)))],
-           vec.prefix#".nmadd\t$dst, $a, $b, $c",
-           vec.prefix#".nmadd", simdopS, reqs>;
-}
-defm "" : HALF_PRECISION_SIMDMADD<F16x8, 0x14e, 0x14f, [HasFP16]>;
+defm "" : SIMDMADD<F32x4, 0x105, 0x106, [HasRelaxedSIMD]>;
+defm "" : SIMDMADD<F64x2, 0x107, 0x108, [HasRelaxedSIMD]>;
+defm "" : SIMDMADD<F16x8, 0x14e, 0x14f, [HasFP16]>;
 
 //===----------------------------------------------------------------------===//
 // Laneselect
diff --git a/llvm/test/CodeGen/WebAssembly/simd-relaxed-fma.ll b/llvm/test/CodeGen/WebAssembly/simd-relaxed-fma.ll
index 600241aef99d0..e065de38951b1 100644
--- a/llvm/test/CodeGen/WebAssembly/simd-relaxed-fma.ll
+++ b/llvm/test/CodeGen/WebAssembly/simd-relaxed-fma.ll
@@ -2,278 +2,9 @@
 
 ; RUN: llc < %s -disable-wasm-fallthrough-return-opt -wasm-disable-explicit-locals -wasm-keep-registers  -mattr=+fp16,+simd128,+relaxed-simd | FileCheck %s --check-prefix=RELAXED
 ; RUN: llc < %s -disable-wasm-fallthrough-return-opt -wasm-disable-explicit-locals -wasm-keep-registers  -mattr=+fp16,+simd128,              | FileCheck %s --check-prefix=STRICT
-; RUN: llc < %s -disable-wasm-fallthrough-return-opt -wasm-disable-explicit-locals -wasm-keep-registers  -mattr=+simd128                     | FileCheck %s --check-prefix=NOFP16
-; RUN: llc < %s -disable-wasm-fallthrough-return-opt -wasm-disable-explicit-locals -wasm-keep-registers                                      | FileCheck %s --check-prefix=NOSIMD
 
 target triple = "wasm32"
 
-define half @fadd_fmul_contract_f16(half %a, half %b, half %c) {
-; RELAXED-LABEL: fadd_fmul_contract_f16:
-; RELAXED:         .functype fadd_fmul_contract_f16 (f32, f32, f32) -> (f32)
-; RELAXED-NEXT:  # %bb.0:
-; RELAXED-NEXT:    call $push0=, __truncsfhf2, $0
-; RELAXED-NEXT:    call $push1=, __extendhfsf2, $pop0
-; RELAXED-NEXT:    call $push2=, __truncsfhf2, $1
-; RELAXED-NEXT:    call $push3=, __extendhfsf2, $pop2
-; RELAXED-NEXT:    f32.mul $push4=, $pop1, $pop3
-; RELAXED-NEXT:    call $push5=, __truncsfhf2, $2
-; RELAXED-NEXT:    call $push6=, __extendhfsf2, $pop5
-; RELAXED-NEXT:    f32.add $push7=, $pop4, $pop6
-; RELAXED-NEXT:    return $pop7
-;
-; STRICT-LABEL: fadd_fmul_contract_f16:
-; STRICT:         .functype fadd_fmul_contract_f16 (f32, f32, f32) -> (f32)
-; STRICT-NEXT:  # %bb.0:
-; STRICT-NEXT:    call $push0=, __truncsfhf2, $0
-; STRICT-NEXT:    call $push1=, __extendhfsf2, $pop0
-; STRICT-NEXT:    call $push2=, __truncsfhf2, $1
-; STRICT-NEXT:    call $push3=, __extendhfsf2, $pop2
-; STRICT-NEXT:    f32.mul $push4=, $pop1, $pop3
-; STRICT-NEXT:    call $push5=, __truncsfhf2, $2
-; STRICT-NEXT:    call $push6=, __extendhfsf2, $pop5
-; STRICT-NEXT:    f32.add $push7=, $pop4, $pop6
-; STRICT-NEXT:    return $pop7
-;
-; NOFP16-LABEL: fadd_fmul_contract_f16:
-; NOFP16:         .functype fadd_fmul_contract_f16 (f32, f32, f32) -> (f32)
-; NOFP16-NEXT:  # %bb.0:
-; NOFP16-NEXT:    call $push0=, __truncsfhf2, $0
-; NOFP16-NEXT:    call $push1=, __extendhfsf2, $pop0
-; NOFP16-NEXT:    call $push2=, __truncsfhf2, $1
-; NOFP16-NEXT:    call $push3=, __extendhfsf2, $pop2
-; NOFP16-NEXT:    f32.mul $push4=, $pop1, $pop3
-; NOFP16-NEXT:    call $push5=, __truncsfhf2, $2
-; NOFP16-NEXT:    call $push6=, __extendhfsf2, $pop5
-; NOFP16-NEXT:    f32.add $push7=, $pop4, $pop6
-; NOFP16-NEXT:    return $pop7
-;
-; NOSIMD-LABEL: fadd_fmul_contract_f16:
-; NOSIMD:         .functype fadd_fmul_contract_f16 (f32, f32, f32) -> (f32)
-; NOSIMD-NEXT:  # %bb.0:
-; NOSIMD-NEXT:    call $push0=, __truncsfhf2, $0
-; NOSIMD-NEXT:    call $push1=, __extendhfsf2, $pop0
-; NOSIMD-NEXT:    call $push2=, __truncsfhf2, $1
-; NOSIMD-NEXT:    call $push3=, __extendhfsf2, $pop2
-; NOSIMD-NEXT:    f32.mul $push4=, $pop1, $pop3
-; NOSIMD-NEXT:    call $push5=, __truncsfhf2, $2
-; NOSIMD-NEXT:    call $push6=, __extendhfsf2, $pop5
-; NOSIMD-NEXT:    f32.add $push7=, $pop4, $pop6
-; NOSIMD-NEXT:    return $pop7
-  %mul = fmul contract half %b, %a
-  %add = fadd contract half %mul, %c
-  ret half %add
-}
-
-define half @fmuladd_contract_f16(half %a, half %b, half %c) {
-; RELAXED-LABEL: fmuladd_contract_f16:
-; RELAXED:         .functype fmuladd_contract_f16 (f32, f32, f32) -> (f32)
-; RELAXED-NEXT:  # %bb.0:
-; RELAXED-NEXT:    call $push0=, __truncsfhf2, $1
-; RELAXED-NEXT:    call $push1=, __extendhfsf2, $pop0
-; RELAXED-NEXT:    call $push2=, __truncsfhf2, $0
-; RELAXED-NEXT:    call $push3=, __extendhfsf2, $pop2
-; RELAXED-NEXT:    f32.mul $push4=, $pop1, $pop3
-; RELAXED-NEXT:    call $push5=, __truncsfhf2, $2
-; RELAXED-NEXT:    call $push6=, __extendhfsf2, $pop5
-; RELAXED-NEXT:    f32.add $push7=, $pop4, $pop6
-; RELAXED-NEXT:    return $pop7
-;
-; STRICT-LABEL: fmuladd_contract_f16:
-; STRICT:         .functype fmuladd_contract_f16 (f32, f32, f32) -> (f32)
-; STRICT-NEXT:  # %bb.0:
-; STRICT-NEXT:    call $push0=, __truncsfhf2, $1
-; STRICT-NEXT:    call $push1=, __extendhfsf2, $pop0
-; STRICT-NEXT:    call $push2=, __truncsfhf2, $0
-; STRICT-NEXT:    call $push3=, __extendhfsf2, $pop2
-; STRICT-NEXT:    f32.mul $push4=, $pop1, $pop3
-; STRICT-NEXT:    call $push5=, __truncsfhf2, $2
-; STRICT-NEXT:    call $push6=, __extendhfsf2, $pop5
-; STRICT-NEXT:    f32.add $push7=, $pop4, $pop6
-; STRICT-NEXT:    return $pop7
-;
-; NOFP16-LABEL: fmuladd_contract_f16:
-; NOFP16:         .functype fmuladd_contract_f16 (f32, f32, f32) -> (f32)
-; NOFP16-NEXT:  # %bb.0:
-; NOFP16-NEXT:    call $push0=, __truncsfhf2, $1
-; NOFP16-NEXT:    call $push1=, __extendhfsf2, $pop0
-; NOFP16-NEXT:    call $push2=, __truncsfhf2, $0
-; NOFP16-NEXT:    call $push3=, __extendhfsf2, $pop2
-; NOFP16-NEXT:    f32.mul $push4=, $pop1, $pop3
-; NOFP16-NEXT:    call $push5=, __truncsfhf2, $2
-; NOFP16-NEXT:    call $push6=, __extendhfsf2, $pop5
-; NOFP16-NEXT:    f32.add $push7=, $pop4, $pop6
-; NOFP16-NEXT:    return $pop7
-;
-; NOSIMD-LABEL: fmuladd_contract_f16:
-; NOSIMD:         .functype fmuladd_contract_f16 (f32, f32, f32) -> (f32)
-; NOSIMD-NEXT:  # %bb.0:
-; NOSIMD-NEXT:    call $push0=, __truncsfhf2, $1
-; NOSIMD-NEXT:    call $push1=, __extendhfsf2, $pop0
-; NOSIMD-NEXT:    call $push2=, __truncsfhf2, $0
-; NOSIMD-NEXT:    call $push3=, __extendhfsf2, $pop2
-; NOSIMD-NEXT:    f32.mul $push4=, $pop1, $pop3
-; NOSIMD-NEXT:    call $push5=, __truncsfhf2, $2
-; NOSIMD-NEXT:    call $push6=, __extendhfsf2, $pop5
-; NOSIMD-NEXT:    f32.add $push7=, $pop4, $pop6
-; NOSIMD-NEXT:    return $pop7
-  %fma = call contract half @llvm.fmuladd(half %a, half %b, half %c)
-  ret half %fma
-}
-
-define half @fmuladd_f16(half %a, half %b, half %c) {
-; RELAXED-LABEL: fmuladd_f16:
-; RELAXED:         .functype fmuladd_f16 (f32, f32, f32) -> (f32)
-; RELAXED-NEXT:  # %bb.0:
-; RELAXED-NEXT:    call $push0=, __truncsfhf2, $1
-; RELAXED-NEXT:    call $push1=, __extendhfsf2, $pop0
-; RELAXED-NEXT:    call $pus...
[truncated]
 | 
    
  akadutta 
      pushed a commit
        to akadutta/llvm-project
      that referenced
      this pull request
    
      Oct 14, 2025 
    
    
      
  
    
      
    
  
Reverts llvm#161355 Looks like I've broken some intrinsic code generation.
  
    Sign up for free
    to join this conversation on GitHub.
    Already have an account?
    Sign in to comment
  
      
  Add this suggestion to a batch that can be applied as a single commit.
  This suggestion is invalid because no changes were made to the code.
  Suggestions cannot be applied while the pull request is closed.
  Suggestions cannot be applied while viewing a subset of changes.
  Only one suggestion per line can be applied in a batch.
  Add this suggestion to a batch that can be applied as a single commit.
  Applying suggestions on deleted lines is not supported.
  You must change the existing code in this line in order to create a valid suggestion.
  Outdated suggestions cannot be applied.
  This suggestion has been applied or marked resolved.
  Suggestions cannot be applied from pending reviews.
  Suggestions cannot be applied on multi-line comments.
  Suggestions cannot be applied while the pull request is queued to merge.
  Suggestion cannot be applied right now. Please check back later.
  
    
  
    
Reverts #161355
Looks like I've broken some intrinsic code generation.