CodeGen: extend f16 conversions to permit types > float.

author Tim Northover <tnorthover@apple.com>

Thu, 17 Jul 2014 10:51:23 +0000 (10:51 +0000)

committer Tim Northover <tnorthover@apple.com>

Thu, 17 Jul 2014 10:51:23 +0000 (10:51 +0000)
author Tim Northover <tnorthover@apple.com>
Thu, 17 Jul 2014 10:51:23 +0000 (10:51 +0000)
committer Tim Northover <tnorthover@apple.com>
Thu, 17 Jul 2014 10:51:23 +0000 (10:51 +0000)
diff --git a/docs/LangRef.rst b/docs/LangRef.rst

index 17bc352f1c89e5da140c160cd80daaf06bd40991..27fe1be116ea64e30aa6a800b58ab09d1fe15586 100644 (file)
--- a/docs/LangRef.rst
+++ b/docs/LangRef.rst
@@ -8653,14 +8653,14 @@ Syntax:
  
  ::
  
-      declare i16 @llvm.convert.to.fp16(float %a)
+      declare i16 @llvm.convert.to.fp16.f32(float %a)
+      declare i16 @llvm.convert.to.fp16.f64(double %a)
  
  Overview:
  """""""""
  
-The '``llvm.convert.to.fp16``' intrinsic function performs a conversion
-from single precision floating point format to half precision floating
-point format.
+The '``llvm.convert.to.fp16``' intrinsic function performs a conversion from a
+conventional floating point type to half precision floating point format.
  
  Arguments:
  """"""""""
@@ -8671,17 +8671,16 @@ converted.
  Semantics:
  """"""""""
  
-The '``llvm.convert.to.fp16``' intrinsic function performs a conversion
-from single precision floating point format to half precision floating
-point format. The return value is an ``i16`` which contains the
-converted number.
+The '``llvm.convert.to.fp16``' intrinsic function performs a conversion from a
+conventional floating point format to half precision floating point format. The
+return value is an ``i16`` which contains the converted number.
  
  Examples:
  """""""""
  
  .. code-block:: llvm
  
-      %res = call i16 @llvm.convert.to.fp16(float %a)
+      %res = call i16 @llvm.convert.to.fp16.f32(float %a)
        store i16 %res, i16* @x, align 2
  
  .. _int_convert_from_fp16:
@@ -8694,7 +8693,8 @@ Syntax:
  
  ::
  
-      declare float @llvm.convert.from.fp16(i16 %a)
+      declare float @llvm.convert.from.fp16.f32(i16 %a)
+      declare double @llvm.convert.from.fp16.f64(i16 %a)
  
  Overview:
  """""""""
diff --git a/include/llvm/CodeGen/ISDOpcodes.h b/include/llvm/CodeGen/ISDOpcodes.h

index a8f2368054953f9d6ce0ede3b99ade6b893026d8..84447616c989116514bc8026a5d69ec0fd3f1fd9 100644 (file)
--- a/include/llvm/CodeGen/ISDOpcodes.h
+++ b/include/llvm/CodeGen/ISDOpcodes.h
@@ -472,11 +472,11 @@ namespace ISD {
      ///   5) ISD::CvtCode indicating the type of conversion to do
      CONVERT_RNDSAT,
  
-    /// FP16_TO_FP32, FP32_TO_FP16 - These operators are used to perform
-    /// promotions and truncation for half-precision (16 bit) floating
-    /// numbers. We need special nodes since FP16 is a storage-only type with
-    /// special semantics of operations.
-    FP16_TO_FP32, FP32_TO_FP16,
+    /// FP16_TO_FP, FP_TO_FP16 - These operators are used to perform promotions
+    /// and truncation for half-precision (16 bit) floating numbers. These nodes
+    /// form a semi-softened interface for dealing with f16 (as an i16), which
+    /// is often a storage-only type but has native conversions.
+    FP16_TO_FP, FP_TO_FP16,
  
      /// FNEG, FABS, FSQRT, FSIN, FCOS, FPOWI, FPOW,
      /// FLOG, FLOG2, FLOG10, FEXP, FEXP2,
diff --git a/include/llvm/IR/Intrinsics.td b/include/llvm/IR/Intrinsics.td

index ae2a90c6295d131509ed2648cb210a5496a47e05..0b8f64fc7984cc1d4e0f73285de7d4be55ac5547 100644 (file)
--- a/include/llvm/IR/Intrinsics.td
+++ b/include/llvm/IR/Intrinsics.td
@@ -496,10 +496,8 @@ def int_donothing : Intrinsic<[], [], [IntrNoMem]>;
  
  // Intrisics to support half precision floating point format
  let Properties = [IntrNoMem] in {
-def int_convert_to_fp16   : Intrinsic<[llvm_i16_ty], [llvm_float_ty]>,
-                            GCCBuiltin<"__gnu_f2h_ieee">;
-def int_convert_from_fp16 : Intrinsic<[llvm_float_ty], [llvm_i16_ty]>,
-                            GCCBuiltin<"__gnu_h2f_ieee">;
+def int_convert_to_fp16   : Intrinsic<[llvm_i16_ty], [llvm_anyfloat_ty]>;
+def int_convert_from_fp16 : Intrinsic<[llvm_anyfloat_ty], [llvm_i16_ty]>;
  }
  
  // These convert intrinsics are to support various conversions between
diff --git a/include/llvm/Target/TargetSelectionDAG.td b/include/llvm/Target/TargetSelectionDAG.td

index 16cfff179c77dd69fd769334c83fe1a1cc504c5e..216416baa93e8fa4cfd19ade2fd6ba192d4be570 100644 (file)
--- a/include/llvm/Target/TargetSelectionDAG.td
+++ b/include/llvm/Target/TargetSelectionDAG.td
@@ -392,8 +392,8 @@ def sint_to_fp : SDNode<"ISD::SINT_TO_FP" , SDTIntToFPOp>;
  def uint_to_fp : SDNode<"ISD::UINT_TO_FP" , SDTIntToFPOp>;
  def fp_to_sint : SDNode<"ISD::FP_TO_SINT" , SDTFPToIntOp>;
  def fp_to_uint : SDNode<"ISD::FP_TO_UINT" , SDTFPToIntOp>;
-def f16_to_f32 : SDNode<"ISD::FP16_TO_FP32", SDTIntToFPOp>;
-def f32_to_f16 : SDNode<"ISD::FP32_TO_FP16", SDTFPToIntOp>;
+def f16_to_fp  : SDNode<"ISD::FP16_TO_FP" , SDTIntToFPOp>;
+def fp_to_f16  : SDNode<"ISD::FP_TO_FP16" , SDTFPToIntOp>;
  
  def setcc      : SDNode<"ISD::SETCC"      , SDTSetCC>;
  def select     : SDNode<"ISD::SELECT"     , SDTSelect>;
diff --git a/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp b/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp

index bff540ad174a9fab1a3f5b3d28585e3f7dcbd787..58f290e113704554fcab75846740533d475ca6d5 100644 (file)
--- a/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp
+++ b/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp
@@ -1186,6 +1186,7 @@ void SelectionDAGLegalize::LegalizeOp(SDNode *Node) {
      if (Action != TargetLowering::Promote)
        Action = TLI.getOperationAction(Node->getOpcode(), MVT::Other);
      break;
+  case ISD::FP_TO_FP16:
    case ISD::SINT_TO_FP:
    case ISD::UINT_TO_FP:
    case ISD::EXTRACT_VECTOR_ELT:
@@ -3513,10 +3514,26 @@ void SelectionDAGLegalize::ExpandNode(SDNode *Node) {
                                        RTLIB::FMA_F80, RTLIB::FMA_F128,
                                        RTLIB::FMA_PPCF128));
      break;
-  case ISD::FP16_TO_FP32:
-    Results.push_back(ExpandLibCall(RTLIB::FPEXT_F16_F32, Node, false));
+  case ISD::FP16_TO_FP: {
+    if (Node->getValueType(0) == MVT::f32) {
+      Results.push_back(ExpandLibCall(RTLIB::FPEXT_F16_F32, Node, false));
+      break;
+    }
+
+    // We can extend to types bigger than f32 in two steps without changing the
+    // result. Since "f16 -> f32" is much more commonly available, give CodeGen
+    // the option of emitting that before resorting to a libcall.
+    SDValue Res =
+        DAG.getNode(ISD::FP16_TO_FP, dl, MVT::f32, Node->getOperand(0));
+    Results.push_back(
+        DAG.getNode(ISD::FP_EXTEND, dl, Node->getValueType(0), Res));
      break;
-  case ISD::FP32_TO_FP16:
+  }
+  case ISD::FP_TO_FP16:
+    // Can't use two-step truncation here because the rounding may be
+    // significant.
+    assert(Node->getOperand(0).getValueType() == MVT::f32 &&
+           "Don't know libcall for FPROUND_F64_F16");
      Results.push_back(ExpandLibCall(RTLIB::FPROUND_F32_F16, Node, false));
      break;
    case ISD::ConstantFP: {
diff --git a/lib/CodeGen/SelectionDAG/LegalizeFloatTypes.cpp b/lib/CodeGen/SelectionDAG/LegalizeFloatTypes.cpp

index 6b8fec6e824a0b31ff63dba63d2edb5306e3fefe..f6796e0828f248823b8f859553fd76a7a7f1a9e9 100644 (file)
--- a/lib/CodeGen/SelectionDAG/LegalizeFloatTypes.cpp
+++ b/lib/CodeGen/SelectionDAG/LegalizeFloatTypes.cpp
@@ -85,7 +85,7 @@ void DAGTypeLegalizer::SoftenFloatResult(SDNode *N, unsigned ResNo) {
      case ISD::FNEG:        R = SoftenFloatRes_FNEG(N); break;
      case ISD::FP_EXTEND:   R = SoftenFloatRes_FP_EXTEND(N); break;
      case ISD::FP_ROUND:    R = SoftenFloatRes_FP_ROUND(N); break;
-    case ISD::FP16_TO_FP32:R = SoftenFloatRes_FP16_TO_FP32(N); break;
+    case ISD::FP16_TO_FP:  R = SoftenFloatRes_FP16_TO_FP(N); break;
      case ISD::FPOW:        R = SoftenFloatRes_FPOW(N); break;
      case ISD::FPOWI:       R = SoftenFloatRes_FPOWI(N); break;
      case ISD::FREM:        R = SoftenFloatRes_FREM(N); break;
@@ -380,11 +380,18 @@ SDValue DAGTypeLegalizer::SoftenFloatRes_FP_EXTEND(SDNode *N) {
  
  // FIXME: Should we just use 'normal' FP_EXTEND / FP_TRUNC instead of special
  // nodes?
-SDValue DAGTypeLegalizer::SoftenFloatRes_FP16_TO_FP32(SDNode *N) {
-  EVT NVT = TLI.getTypeToTransformTo(*DAG.getContext(), N->getValueType(0));
+SDValue DAGTypeLegalizer::SoftenFloatRes_FP16_TO_FP(SDNode *N) {
+  EVT MidVT = TLI.getTypeToTransformTo(*DAG.getContext(), MVT::f32);
    SDValue Op = N->getOperand(0);
-  return TLI.makeLibCall(DAG, RTLIB::FPEXT_F16_F32, NVT, &Op, 1, false,
-                         SDLoc(N)).first;
+  SDValue Res32 = TLI.makeLibCall(DAG, RTLIB::FPEXT_F16_F32, MidVT, &Op, 1,
+                                  false, SDLoc(N)).first;
+  if (N->getValueType(0) == MVT::f32)
+    return Res32;
+
+  EVT NVT = TLI.getTypeToTransformTo(*DAG.getContext(), N->getValueType(0));
+  RTLIB::Libcall LC = RTLIB::getFPEXT(MVT::f32, N->getValueType(0));
+  assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unsupported FP_EXTEND!");
+  return TLI.makeLibCall(DAG, LC, NVT, &Res32, 1, false, SDLoc(N)).first;
  }
  
  SDValue DAGTypeLegalizer::SoftenFloatRes_FP_ROUND(SDNode *N) {
@@ -628,7 +635,7 @@ bool DAGTypeLegalizer::SoftenFloatOperand(SDNode *N, unsigned OpNo) {
    case ISD::FP_ROUND:    Res = SoftenFloatOp_FP_ROUND(N); break;
    case ISD::FP_TO_SINT:  Res = SoftenFloatOp_FP_TO_SINT(N); break;
    case ISD::FP_TO_UINT:  Res = SoftenFloatOp_FP_TO_UINT(N); break;
-  case ISD::FP32_TO_FP16:Res = SoftenFloatOp_FP32_TO_FP16(N); break;
+  case ISD::FP_TO_FP16:  Res = SoftenFloatOp_FP_TO_FP16(N); break;
    case ISD::SELECT_CC:   Res = SoftenFloatOp_SELECT_CC(N); break;
    case ISD::SETCC:       Res = SoftenFloatOp_SETCC(N); break;
    case ISD::STORE:       Res = SoftenFloatOp_STORE(N, OpNo); break;
@@ -704,7 +711,9 @@ SDValue DAGTypeLegalizer::SoftenFloatOp_FP_TO_UINT(SDNode *N) {
    return TLI.makeLibCall(DAG, LC, RVT, &Op, 1, false, SDLoc(N)).first;
  }
  
-SDValue DAGTypeLegalizer::SoftenFloatOp_FP32_TO_FP16(SDNode *N) {
+SDValue DAGTypeLegalizer::SoftenFloatOp_FP_TO_FP16(SDNode *N) {
+  assert(N->getOperand(0).getValueType() == MVT::f32 &&
+         "Cannot soften in one step");
    EVT RVT = N->getValueType(0);
    RTLIB::Libcall LC = RTLIB::FPROUND_F32_F16;
    SDValue Op = GetSoftenedFloat(N->getOperand(0));
diff --git a/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp b/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp

index 6feac0de73f4a06e6b113167d8158f7fd7e06a96..484bcb7cccdef5e478006a354a0b5c0029da4b28 100644 (file)
--- a/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp
+++ b/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp
@@ -99,7 +99,7 @@ void DAGTypeLegalizer::PromoteIntegerResult(SDNode *N, unsigned ResNo) {
    case ISD::FP_TO_SINT:
    case ISD::FP_TO_UINT:  Res = PromoteIntRes_FP_TO_XINT(N); break;
  
-  case ISD::FP32_TO_FP16:Res = PromoteIntRes_FP32_TO_FP16(N); break;
+  case ISD::FP_TO_FP16:  Res = PromoteIntRes_FP_TO_FP16(N); break;
  
    case ISD::AND:
    case ISD::OR:
@@ -401,7 +401,7 @@ SDValue DAGTypeLegalizer::PromoteIntRes_FP_TO_XINT(SDNode *N) {
                       DAG.getValueType(N->getValueType(0).getScalarType()));
  }
  
-SDValue DAGTypeLegalizer::PromoteIntRes_FP32_TO_FP16(SDNode *N) {
+SDValue DAGTypeLegalizer::PromoteIntRes_FP_TO_FP16(SDNode *N) {
    EVT NVT = TLI.getTypeToTransformTo(*DAG.getContext(), N->getValueType(0));
    SDLoc dl(N);
  
@@ -826,7 +826,7 @@ bool DAGTypeLegalizer::PromoteIntegerOperand(SDNode *N, unsigned OpNo) {
    case ISD::STORE:        Res = PromoteIntOp_STORE(cast<StoreSDNode>(N),
                                                     OpNo); break;
    case ISD::TRUNCATE:     Res = PromoteIntOp_TRUNCATE(N); break;
-  case ISD::FP16_TO_FP32:
+  case ISD::FP16_TO_FP:
    case ISD::UINT_TO_FP:   Res = PromoteIntOp_UINT_TO_FP(N); break;
    case ISD::ZERO_EXTEND:  Res = PromoteIntOp_ZERO_EXTEND(N); break;
  
diff --git a/lib/CodeGen/SelectionDAG/LegalizeTypes.h b/lib/CodeGen/SelectionDAG/LegalizeTypes.h

index d0ca6f870da49f31d4910f8c98eeeafdd8df5568..92a1b70a58c16d7d82656df30fa972a9b0eab9ec 100644 (file)
--- a/lib/CodeGen/SelectionDAG/LegalizeTypes.h
+++ b/lib/CodeGen/SelectionDAG/LegalizeTypes.h
@@ -237,7 +237,7 @@ private:
    SDValue PromoteIntRes_CTTZ(SDNode *N);
    SDValue PromoteIntRes_EXTRACT_VECTOR_ELT(SDNode *N);
    SDValue PromoteIntRes_FP_TO_XINT(SDNode *N);
-  SDValue PromoteIntRes_FP32_TO_FP16(SDNode *N);
+  SDValue PromoteIntRes_FP_TO_FP16(SDNode *N);
    SDValue PromoteIntRes_INT_EXTEND(SDNode *N);
    SDValue PromoteIntRes_LOAD(LoadSDNode *N);
    SDValue PromoteIntRes_Overflow(SDNode *N);
@@ -403,7 +403,7 @@ private:
    SDValue SoftenFloatRes_FNEARBYINT(SDNode *N);
    SDValue SoftenFloatRes_FNEG(SDNode *N);
    SDValue SoftenFloatRes_FP_EXTEND(SDNode *N);
-  SDValue SoftenFloatRes_FP16_TO_FP32(SDNode *N);
+  SDValue SoftenFloatRes_FP16_TO_FP(SDNode *N);
    SDValue SoftenFloatRes_FP_ROUND(SDNode *N);
    SDValue SoftenFloatRes_FPOW(SDNode *N);
    SDValue SoftenFloatRes_FPOWI(SDNode *N);
@@ -428,7 +428,7 @@ private:
    SDValue SoftenFloatOp_FP_ROUND(SDNode *N);
    SDValue SoftenFloatOp_FP_TO_SINT(SDNode *N);
    SDValue SoftenFloatOp_FP_TO_UINT(SDNode *N);
-  SDValue SoftenFloatOp_FP32_TO_FP16(SDNode *N);
+  SDValue SoftenFloatOp_FP_TO_FP16(SDNode *N);
    SDValue SoftenFloatOp_SELECT_CC(SDNode *N);
    SDValue SoftenFloatOp_SETCC(SDNode *N);
    SDValue SoftenFloatOp_STORE(SDNode *N, unsigned OpNo);
diff --git a/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp b/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

index b85e09d37e99ee38cc9fa0e5e61aadf86df361a9..189b56d5a933041b75e8a0178b85a0580746dd12 100644 (file)
--- a/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
+++ b/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
@@ -5155,12 +5155,13 @@ SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I, unsigned Intrinsic) {
      return nullptr;
    }
    case Intrinsic::convert_to_fp16:
-    setValue(&I, DAG.getNode(ISD::FP32_TO_FP16, sdl,
+    setValue(&I, DAG.getNode(ISD::FP_TO_FP16, sdl,
                               MVT::i16, getValue(I.getArgOperand(0))));
      return nullptr;
    case Intrinsic::convert_from_fp16:
-    setValue(&I, DAG.getNode(ISD::FP16_TO_FP32, sdl,
-                             MVT::f32, getValue(I.getArgOperand(0))));
+    setValue(&I,
+             DAG.getNode(ISD::FP16_TO_FP, sdl, TLI->getValueType(I.getType()),
+                         getValue(I.getArgOperand(0))));
      return nullptr;
    case Intrinsic::pcmarker: {
      SDValue Tmp = getValue(I.getArgOperand(0));
diff --git a/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp b/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp

index b3a452f2148de1349471d1b9cf2f0761fc80a10d..a71cc6859ea0df48b18a35d87cc76bd80e0b6bbb 100644 (file)
--- a/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp
+++ b/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp
@@ -236,8 +236,8 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::FP_TO_UINT:                 return "fp_to_uint";
    case ISD::BITCAST:                    return "bitcast";
    case ISD::ADDRSPACECAST:              return "addrspacecast";
-  case ISD::FP16_TO_FP32:               return "fp16_to_fp32";
-  case ISD::FP32_TO_FP16:               return "fp32_to_fp16";
+  case ISD::FP16_TO_FP:                 return "fp16_to_fp";
+  case ISD::FP_TO_FP16:                 return "fp_to_fp16";
  
    case ISD::CONVERT_RNDSAT: {
      switch (cast<CvtRndSatSDNode>(this)->getCvtCode()) {
diff --git a/lib/Target/AArch64/AArch64InstrInfo.td b/lib/Target/AArch64/AArch64InstrInfo.td

index 0fae80219506e7b9e50606b8490c457b2302db00..2708ee03313ecb777971da0452dd3b0ad4ca02a2 100644 (file)
--- a/lib/Target/AArch64/AArch64InstrInfo.td
+++ b/lib/Target/AArch64/AArch64InstrInfo.td
@@ -2244,46 +2244,46 @@ def : Pat<(f64 (fpimm0)), (FMOVXDr XZR)>, Requires<[NoZCZ]>;
  
  defm FCVT : FPConversion<"fcvt">;
  
-def : Pat<(f32_to_f16 FPR32:$Rn),
+def : Pat<(fp_to_f16 FPR32:$Rn),
            (i32 (COPY_TO_REGCLASS
                     (f32 (SUBREG_TO_REG (i32 0), (FCVTHSr FPR32:$Rn), hsub)),
                     GPR32))>;
  
-def : Pat<(f32 (f16_to_f32 i32:$Rn)),
+def : Pat<(f32 (f16_to_fp i32:$Rn)),
            (FCVTSHr (EXTRACT_SUBREG (i32 (COPY_TO_REGCLASS i32:$Rn, FPR32)),
                                     hsub))>;
  
  // When converting from f16 coming directly from a load, make sure we
  // load into the FPR16 registers rather than going through the GPRs.
  //   f16->f32
-def : Pat<(f32 (f16_to_f32 (i32
+def : Pat<(f32 (f16_to_fp (i32
                  (zextloadi16 (ro_Windexed16 GPR64sp:$Rn, GPR32:$Rm,
                                      ro_Wextend16:$extend))))),
            (FCVTSHr (LDRHroW GPR64sp:$Rn, GPR32:$Rm, ro_Wextend16:$extend))>;
-def : Pat<(f32 (f16_to_f32 (i32
+def : Pat<(f32 (f16_to_fp (i32
                  (zextloadi16 (ro_Xindexed16 GPR64sp:$Rn, GPR64:$Rm,
                                      ro_Xextend16:$extend))))),
            (FCVTSHr (LDRHroX GPR64sp:$Rn, GPR64:$Rm, ro_Xextend16:$extend))>;
-def : Pat <(f32 (f16_to_f32 (i32
+def : Pat <(f32 (f16_to_fp (i32
                    (zextloadi16 (am_indexed16 GPR64sp:$Rn, uimm12s2:$offset))))),
             (FCVTSHr (LDRHui GPR64sp:$Rn, uimm12s2:$offset))>;
-def : Pat <(f32 (f16_to_f32 (i32
+def : Pat <(f32 (f16_to_fp (i32
                    (zextloadi16 (am_unscaled16 GPR64sp:$Rn, simm9:$offset))))),
             (FCVTSHr (LDURHi GPR64sp:$Rn, simm9:$offset))>;
  
  //   f16->f64
-def : Pat<(f64 (fextend (f32 (f16_to_f32 (i32
+def : Pat<(f64 (fextend (f32 (f16_to_fp (i32
                  (zextloadi16 (ro_Windexed16 GPR64sp:$Rn, GPR32:$Rm,
                                      ro_Wextend16:$extend))))))),
            (FCVTDHr (LDRHroW GPR64sp:$Rn, GPR32:$Rm, ro_Wextend16:$extend))>;
-def : Pat<(f64 (fextend (f32 (f16_to_f32 (i32
+def : Pat<(f64 (fextend (f32 (f16_to_fp (i32
                  (zextloadi16 (ro_Xindexed16 GPR64sp:$Rn, GPR64:$Rm,
                                      ro_Xextend16:$extend))))))),
            (FCVTDHr (LDRHroX GPR64sp:$Rn, GPR64:$Rm, ro_Xextend16:$extend))>;
-def : Pat <(f64 (fextend (f32 (f16_to_f32 (i32
+def : Pat <(f64 (fextend (f32 (f16_to_fp (i32
                    (zextloadi16 (am_indexed16 GPR64sp:$Rn, uimm12s2:$offset))))))),
             (FCVTDHr (LDRHui GPR64sp:$Rn, uimm12s2:$offset))>;
-def : Pat <(f64 (fextend (f32 (f16_to_f32 (i32
+def : Pat <(f64 (fextend (f32 (f16_to_fp (i32
                    (zextloadi16 (am_unscaled16 GPR64sp:$Rn, simm9:$offset))))))),
             (FCVTDHr (LDURHi GPR64sp:$Rn, simm9:$offset))>;
  
@@ -2292,37 +2292,37 @@ def : Pat <(f64 (fextend (f32 (f16_to_f32 (i32
  // registers rather than going through the GPRs.
  let AddedComplexity = 10 in {
  // f32->f16
-def : Pat< (truncstorei16 (assertzext (i32 (f32_to_f16 FPR32:$Rt))),
+def : Pat< (truncstorei16 (assertzext (i32 (fp_to_f16 FPR32:$Rt))),
                            (ro_Windexed16 GPR64sp:$Rn, GPR32:$Rm,
                                           ro_Wextend16:$extend)),
             (STRHroW (FCVTHSr FPR32:$Rt), GPR64sp:$Rn, GPR32:$Rm,
                                           ro_Wextend16:$extend)>;
-def : Pat< (truncstorei16 (assertzext (i32 (f32_to_f16 FPR32:$Rt))),
+def : Pat< (truncstorei16 (assertzext (i32 (fp_to_f16 FPR32:$Rt))),
                            (ro_Xindexed16 GPR64sp:$Rn, GPR64:$Rm,
                                           ro_Xextend16:$extend)),
             (STRHroX (FCVTHSr FPR32:$Rt), GPR64sp:$Rn, GPR64:$Rm,
                                           ro_Xextend16:$extend)>;
-def : Pat <(truncstorei16 (assertzext (i32 (f32_to_f16 FPR32:$Rt))),
+def : Pat <(truncstorei16 (assertzext (i32 (fp_to_f16 FPR32:$Rt))),
                (am_indexed16 GPR64sp:$Rn, uimm12s2:$offset)),
             (STRHui (FCVTHSr FPR32:$Rt), GPR64sp:$Rn, uimm12s2:$offset)>;
-def : Pat <(truncstorei16 (assertzext (i32 (f32_to_f16 FPR32:$Rt))),
+def : Pat <(truncstorei16 (assertzext (i32 (fp_to_f16 FPR32:$Rt))),
                (am_unscaled16 GPR64sp:$Rn, simm9:$offset)),
             (STURHi (FCVTHSr FPR32:$Rt), GPR64sp:$Rn, simm9:$offset)>;
  // f64->f16
-def : Pat< (truncstorei16 (assertzext (i32 (f32_to_f16 (f32 (fround FPR64:$Rt))))),
+def : Pat< (truncstorei16 (assertzext (i32 (fp_to_f16 (f32 (fround FPR64:$Rt))))),
                            (ro_Windexed16 GPR64sp:$Rn, GPR32:$Rm,
                                           ro_Wextend16:$extend)),
             (STRHroW (FCVTHDr FPR64:$Rt), GPR64sp:$Rn, GPR32:$Rm,
                                           ro_Wextend16:$extend)>;
-def : Pat< (truncstorei16 (assertzext (i32 (f32_to_f16 (f32 (fround FPR64:$Rt))))),
+def : Pat< (truncstorei16 (assertzext (i32 (fp_to_f16 (f32 (fround FPR64:$Rt))))),
                            (ro_Xindexed16 GPR64sp:$Rn, GPR64:$Rm,
                                           ro_Xextend16:$extend)),
             (STRHroX (FCVTHDr FPR64:$Rt), GPR64sp:$Rn, GPR64:$Rm,
                                           ro_Xextend16:$extend)>;
-def : Pat <(truncstorei16 (assertzext (i32 (f32_to_f16 (f32 (fround FPR64:$Rt))))),
+def : Pat <(truncstorei16 (assertzext (i32 (fp_to_f16 (f32 (fround FPR64:$Rt))))),
                (am_indexed16 GPR64sp:$Rn, uimm12s2:$offset)),
             (STRHui (FCVTHDr FPR64:$Rt), GPR64sp:$Rn, uimm12s2:$offset)>;
-def : Pat <(truncstorei16 (assertzext (i32 (f32_to_f16 (f32 (fround FPR64:$Rt))))),
+def : Pat <(truncstorei16 (assertzext (i32 (fp_to_f16 (f32 (fround FPR64:$Rt))))),
                (am_unscaled16 GPR64sp:$Rn, simm9:$offset)),
             (STURHi (FCVTHDr FPR64:$Rt), GPR64sp:$Rn, simm9:$offset)>;
  }
diff --git a/lib/Target/ARM/ARMISelLowering.cpp b/lib/Target/ARM/ARMISelLowering.cpp

index 4bfa5a8b5c625312d7b1dba78bf5de57f82ce764..e74d0540eb0f67e321df13ab6e894008006d1c79 100644 (file)
--- a/lib/Target/ARM/ARMISelLowering.cpp
+++ b/lib/Target/ARM/ARMISelLowering.cpp
@@ -827,8 +827,8 @@ ARMTargetLowering::ARMTargetLowering(TargetMachine &TM)
      }
      // Special handling for half-precision FP.
      if (!Subtarget->hasFP16()) {
-      setOperationAction(ISD::FP16_TO_FP32, MVT::f32, Expand);
-      setOperationAction(ISD::FP32_TO_FP16, MVT::i32, Expand);
+      setOperationAction(ISD::FP16_TO_FP, MVT::f32, Expand);
+      setOperationAction(ISD::FP_TO_FP16, MVT::f32, Expand);
      }
    }
  
diff --git a/lib/Target/ARM/ARMInstrVFP.td b/lib/Target/ARM/ARMInstrVFP.td

index 1d7802a2c7fb094f156a7a4139118af75d857f20..e709e59b3fa783e61dda6bb1fad706ba85c02cc3 100644 (file)
--- a/lib/Target/ARM/ARMInstrVFP.td
+++ b/lib/Target/ARM/ARMInstrVFP.td
@@ -551,10 +551,10 @@ def VCVTBSH: ASuI<0b11101, 0b11, 0b0011, 0b01, 0, (outs SPR:$Sd), (ins SPR:$Sm),
                   /* FIXME */ IIC_fpCVTHS, "vcvtb", ".f16.f32\t$Sd, $Sm",
                   [/* For disassembly only; pattern left blank */]>;
  
-def : Pat<(f32_to_f16 SPR:$a),
+def : Pat<(fp_to_f16 SPR:$a),
            (i32 (COPY_TO_REGCLASS (VCVTBSH SPR:$a), GPR))>;
  
-def : Pat<(f16_to_f32 GPR:$a),
+def : Pat<(f16_to_fp GPR:$a),
            (VCVTBHS (COPY_TO_REGCLASS GPR:$a, SPR))>;
  
  def VCVTTHS: ASuI<0b11101, 0b11, 0b0010, 0b11, 0, (outs SPR:$Sd), (ins SPR:$Sm),
diff --git a/lib/Target/NVPTX/NVPTXIntrinsics.td b/lib/Target/NVPTX/NVPTXIntrinsics.td

index 0ad3dfaa4c8f5e50240e4d0d3751550a2f3fc7ee..06873b7d1d899a59d1b990f851c7b4842c6b4e99 100644 (file)
--- a/lib/Target/NVPTX/NVPTXIntrinsics.td
+++ b/lib/Target/NVPTX/NVPTXIntrinsics.td
@@ -792,11 +792,11 @@ def INT_NVVM_H2F : F_MATH_1<!strconcat("{{\n\t",
              "}}")))),
            Float32Regs, Int16Regs, int_nvvm_h2f>;
  
-def : Pat<(f32 (f16_to_f32 Int16Regs:$a)),
+def : Pat<(f32 (f16_to_fp Int16Regs:$a)),
            (CVT_f32_f16 Int16Regs:$a, CvtNONE)>;
-def : Pat<(i16 (f32_to_f16 Float32Regs:$a)),
+def : Pat<(i16 (fp_to_f16 Float32Regs:$a)),
            (CVT_f16_f32 Float32Regs:$a, CvtRN_FTZ)>, Requires<[doF32FTZ]>;
-def : Pat<(i16 (f32_to_f16 Float32Regs:$a)),
+def : Pat<(i16 (fp_to_f16 Float32Regs:$a)),
            (CVT_f16_f32 Float32Regs:$a, CvtRN)>;
  
  //
diff --git a/lib/Target/R600/SIInstructions.td b/lib/Target/R600/SIInstructions.td

index 1a9be6c6157eaf74878e80661025e64bc60c7f09..a4920db33788f5a05a7b44a40ab6c66b9a459e7b 100644 (file)
--- a/lib/Target/R600/SIInstructions.td
+++ b/lib/Target/R600/SIInstructions.td
@@ -1079,10 +1079,10 @@ defm V_CVT_I32_F32 : VOP1_32 <0x00000008, "V_CVT_I32_F32",
  >;
  defm V_MOV_FED_B32 : VOP1_32 <0x00000009, "V_MOV_FED_B32", []>;
  defm V_CVT_F16_F32 : VOP1_32 <0x0000000a, "V_CVT_F16_F32",
-  [(set i32:$dst, (f32_to_f16 f32:$src0))]
+  [(set i32:$dst, (fp_to_f16 f32:$src0))]
  >;
  defm V_CVT_F32_F16 : VOP1_32 <0x0000000b, "V_CVT_F32_F16",
-  [(set f32:$dst, (f16_to_f32 i32:$src0))]
+  [(set f32:$dst, (f16_to_fp i32:$src0))]
  >;
  //defm V_CVT_RPI_I32_F32 : VOP1_32 <0x0000000c, "V_CVT_RPI_I32_F32", []>;
  //defm V_CVT_FLR_I32_F32 : VOP1_32 <0x0000000d, "V_CVT_FLR_I32_F32", []>;
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp

index 19bfa0defe0dba7e87d0230995b61c1abe3b43c6..39186c54f9d48c8e4aacbdfaab50465141082f52 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -519,8 +519,8 @@ void X86TargetLowering::resetOperationActions() {
    // If we don't have F16C support, then lower half float conversions
    // into library calls.
    if (TM.Options.UseSoftFloat || !Subtarget->hasF16C()) {
-    setOperationAction(ISD::FP16_TO_FP32, MVT::f32, Expand);
-    setOperationAction(ISD::FP32_TO_FP16, MVT::i16, Expand);
+    setOperationAction(ISD::FP16_TO_FP, MVT::f32, Expand);
+    setOperationAction(ISD::FP_TO_FP16, MVT::f32, Expand);
    }
  
    if (Subtarget->hasPOPCNT()) {
diff --git a/lib/Target/X86/X86InstrSSE.td b/lib/Target/X86/X86InstrSSE.td

index f9a5ae1a3d524d10ab4ac83230ae1fba92b0f09f..2bb898e7465b2b61e232bfcd22381cd3b1449d26 100644 (file)
--- a/lib/Target/X86/X86InstrSSE.td
+++ b/lib/Target/X86/X86InstrSSE.td
@@ -8540,15 +8540,15 @@ let Predicates = [HasF16C] in {
  
  // Patterns for  matching conversions from float to half-float and vice versa.
  let Predicates = [HasF16C] in {
-  def : Pat<(f32_to_f16 FR32:$src),
+  def : Pat<(fp_to_f16 FR32:$src),
              (i16 (EXTRACT_SUBREG (VMOVPDI2DIrr (VCVTPS2PHrr
                (COPY_TO_REGCLASS FR32:$src, VR128), 0)), sub_16bit))>;
  
-  def : Pat<(f16_to_f32 GR16:$src),
+  def : Pat<(f16_to_fp GR16:$src),
              (f32 (COPY_TO_REGCLASS (VCVTPH2PSrr
                (COPY_TO_REGCLASS (MOVSX32rr16 GR16:$src), VR128)), FR32)) >;
  
-  def : Pat<(f16_to_f32 (i16 (f32_to_f16 FR32:$src))),
+  def : Pat<(f16_to_fp (i16 (fp_to_f16 FR32:$src))),
              (f32 (COPY_TO_REGCLASS (VCVTPH2PSrr
                (VCVTPS2PHrr (COPY_TO_REGCLASS FR32:$src, VR128), 0)), FR32)) >;
  }
diff --git a/test/CodeGen/AArch64/arm64-vcvt_f.ll b/test/CodeGen/AArch64/arm64-vcvt_f.ll

index cad8353a156aa0e5415a8b1790ff4944d4de6daa..1f393c21a1a181535e57beb41bc54cef658d9a99 100644 (file)
--- a/test/CodeGen/AArch64/arm64-vcvt_f.ll
+++ b/test/CodeGen/AArch64/arm64-vcvt_f.ll
@@ -66,7 +66,7 @@ define i16 @to_half(float %in) {
  ; CHECK-LABEL: to_half:
  ; CHECK: fcvt h[[HALFVAL:[0-9]+]], s0
  ; CHECK: fmov {{w[0-9]+}}, {{s[0-9]+}}
-  %res = call i16 @llvm.convert.to.fp16(float %in)
+  %res = call i16 @llvm.convert.to.fp16.f32(float %in)
    ret i16 %res
  }
  
@@ -74,9 +74,9 @@ define float @from_half(i16 %in) {
  ; CHECK-LABEL: from_half:
  ; CHECK: fmov {{s[0-9]+}}, {{w[0-9]+}}
  ; CHECK: fcvt s0, {{h[0-9]+}}
-  %res = call float @llvm.convert.from.fp16(i16 %in)
+  %res = call float @llvm.convert.from.fp16.f32(i16 %in)
    ret float %res
  }
  
-declare float @llvm.convert.from.fp16(i16) #1
-declare i16 @llvm.convert.to.fp16(float) #1
+declare float @llvm.convert.from.fp16.f32(i16) #1
+declare i16 @llvm.convert.to.fp16.f32(float) #1
diff --git a/test/CodeGen/AArch64/f16-convert.ll b/test/CodeGen/AArch64/f16-convert.ll

index 6fabdc5749748bfb2bbda64dfff0a237caf3cd8f..72685e87bd5776185e54376fd1fd34cdd41c7b05 100644 (file)
--- a/test/CodeGen/AArch64/f16-convert.ll
+++ b/test/CodeGen/AArch64/f16-convert.ll
@@ -7,7 +7,7 @@ define float @load0(i16* nocapture readonly %a) nounwind {
  ; CHECK-NEXT: ret
  
    %tmp = load i16* %a, align 2
-  %tmp1 = tail call float @llvm.convert.from.fp16(i16 %tmp)
+  %tmp1 = tail call float @llvm.convert.from.fp16.f32(i16 %tmp)
    ret float %tmp1
  }
  
@@ -18,7 +18,7 @@ define double @load1(i16* nocapture readonly %a) nounwind {
  ; CHECK-NEXT: ret
  
    %tmp = load i16* %a, align 2
-  %tmp1 = tail call float @llvm.convert.from.fp16(i16 %tmp)
+  %tmp1 = tail call float @llvm.convert.from.fp16.f32(i16 %tmp)
    %conv = fpext float %tmp1 to double
    ret double %conv
  }
@@ -32,7 +32,7 @@ define float @load2(i16* nocapture readonly %a, i32 %i) nounwind {
    %idxprom = sext i32 %i to i64
    %arrayidx = getelementptr inbounds i16* %a, i64 %idxprom
    %tmp = load i16* %arrayidx, align 2
-  %tmp1 = tail call float @llvm.convert.from.fp16(i16 %tmp)
+  %tmp1 = tail call float @llvm.convert.from.fp16.f32(i16 %tmp)
    ret float %tmp1
  }
  
@@ -45,7 +45,7 @@ define double @load3(i16* nocapture readonly %a, i32 %i) nounwind {
    %idxprom = sext i32 %i to i64
    %arrayidx = getelementptr inbounds i16* %a, i64 %idxprom
    %tmp = load i16* %arrayidx, align 2
-  %tmp1 = tail call float @llvm.convert.from.fp16(i16 %tmp)
+  %tmp1 = tail call float @llvm.convert.from.fp16.f32(i16 %tmp)
    %conv = fpext float %tmp1 to double
    ret double %conv
  }
@@ -58,7 +58,7 @@ define float @load4(i16* nocapture readonly %a, i64 %i) nounwind {
  
    %arrayidx = getelementptr inbounds i16* %a, i64 %i
    %tmp = load i16* %arrayidx, align 2
-  %tmp1 = tail call float @llvm.convert.from.fp16(i16 %tmp)
+  %tmp1 = tail call float @llvm.convert.from.fp16.f32(i16 %tmp)
    ret float %tmp1
  }
  
@@ -70,7 +70,7 @@ define double @load5(i16* nocapture readonly %a, i64 %i) nounwind {
  
    %arrayidx = getelementptr inbounds i16* %a, i64 %i
    %tmp = load i16* %arrayidx, align 2
-  %tmp1 = tail call float @llvm.convert.from.fp16(i16 %tmp)
+  %tmp1 = tail call float @llvm.convert.from.fp16.f32(i16 %tmp)
    %conv = fpext float %tmp1 to double
    ret double %conv
  }
@@ -83,7 +83,7 @@ define float @load6(i16* nocapture readonly %a) nounwind {
  
    %arrayidx = getelementptr inbounds i16* %a, i64 10
    %tmp = load i16* %arrayidx, align 2
-  %tmp1 = tail call float @llvm.convert.from.fp16(i16 %tmp)
+  %tmp1 = tail call float @llvm.convert.from.fp16.f32(i16 %tmp)
    ret float %tmp1
  }
  
@@ -95,7 +95,7 @@ define double @load7(i16* nocapture readonly %a) nounwind {
  
    %arrayidx = getelementptr inbounds i16* %a, i64 10
    %tmp = load i16* %arrayidx, align 2
-  %tmp1 = tail call float @llvm.convert.from.fp16(i16 %tmp)
+  %tmp1 = tail call float @llvm.convert.from.fp16.f32(i16 %tmp)
    %conv = fpext float %tmp1 to double
    ret double %conv
  }
@@ -108,7 +108,7 @@ define float @load8(i16* nocapture readonly %a) nounwind {
  
    %arrayidx = getelementptr inbounds i16* %a, i64 -10
    %tmp = load i16* %arrayidx, align 2
-  %tmp1 = tail call float @llvm.convert.from.fp16(i16 %tmp)
+  %tmp1 = tail call float @llvm.convert.from.fp16.f32(i16 %tmp)
    ret float %tmp1
  }
  
@@ -120,7 +120,7 @@ define double @load9(i16* nocapture readonly %a) nounwind {
  
    %arrayidx = getelementptr inbounds i16* %a, i64 -10
    %tmp = load i16* %arrayidx, align 2
-  %tmp1 = tail call float @llvm.convert.from.fp16(i16 %tmp)
+  %tmp1 = tail call float @llvm.convert.from.fp16.f32(i16 %tmp)
    %conv = fpext float %tmp1 to double
    ret double %conv
  }
@@ -131,7 +131,7 @@ define void @store0(i16* nocapture %a, float %val) nounwind {
  ; CHECK-NEXT: str  h0, [x0]
  ; CHECK-NEXT: ret
  
-  %tmp = tail call i16 @llvm.convert.to.fp16(float %val)
+  %tmp = tail call i16 @llvm.convert.to.fp16.f32(float %val)
    store i16 %tmp, i16* %a, align 2
    ret void
  }
@@ -143,7 +143,7 @@ define void @store1(i16* nocapture %a, double %val) nounwind {
  ; CHECK-NEXT: ret
  
    %conv = fptrunc double %val to float
-  %tmp = tail call i16 @llvm.convert.to.fp16(float %conv)
+  %tmp = tail call i16 @llvm.convert.to.fp16.f32(float %conv)
    store i16 %tmp, i16* %a, align 2
    ret void
  }
@@ -154,7 +154,7 @@ define void @store2(i16* nocapture %a, i32 %i, float %val) nounwind {
  ; CHECK-NEXT: str h0, [x0, w1, sxtw #1]
  ; CHECK-NEXT: ret
  
-  %tmp = tail call i16 @llvm.convert.to.fp16(float %val)
+  %tmp = tail call i16 @llvm.convert.to.fp16.f32(float %val)
    %idxprom = sext i32 %i to i64
    %arrayidx = getelementptr inbounds i16* %a, i64 %idxprom
    store i16 %tmp, i16* %arrayidx, align 2
@@ -168,7 +168,7 @@ define void @store3(i16* nocapture %a, i32 %i, double %val) nounwind {
  ; CHECK-NEXT: ret
  
    %conv = fptrunc double %val to float
-  %tmp = tail call i16 @llvm.convert.to.fp16(float %conv)
+  %tmp = tail call i16 @llvm.convert.to.fp16.f32(float %conv)
    %idxprom = sext i32 %i to i64
    %arrayidx = getelementptr inbounds i16* %a, i64 %idxprom
    store i16 %tmp, i16* %arrayidx, align 2
@@ -181,7 +181,7 @@ define void @store4(i16* nocapture %a, i64 %i, float %val) nounwind {
  ; CHECK-NEXT: str h0, [x0, x1, lsl #1]
  ; CHECK-NEXT: ret
  
-  %tmp = tail call i16 @llvm.convert.to.fp16(float %val)
+  %tmp = tail call i16 @llvm.convert.to.fp16.f32(float %val)
    %arrayidx = getelementptr inbounds i16* %a, i64 %i
    store i16 %tmp, i16* %arrayidx, align 2
    ret void
@@ -194,7 +194,7 @@ define void @store5(i16* nocapture %a, i64 %i, double %val) nounwind {
  ; CHECK-NEXT: ret
  
    %conv = fptrunc double %val to float
-  %tmp = tail call i16 @llvm.convert.to.fp16(float %conv)
+  %tmp = tail call i16 @llvm.convert.to.fp16.f32(float %conv)
    %arrayidx = getelementptr inbounds i16* %a, i64 %i
    store i16 %tmp, i16* %arrayidx, align 2
    ret void
@@ -206,7 +206,7 @@ define void @store6(i16* nocapture %a, float %val) nounwind {
  ; CHECK-NEXT: str h0, [x0, #20]
  ; CHECK-NEXT: ret
  
-  %tmp = tail call i16 @llvm.convert.to.fp16(float %val)
+  %tmp = tail call i16 @llvm.convert.to.fp16.f32(float %val)
    %arrayidx = getelementptr inbounds i16* %a, i64 10
    store i16 %tmp, i16* %arrayidx, align 2
    ret void
@@ -219,7 +219,7 @@ define void @store7(i16* nocapture %a, double %val) nounwind {
  ; CHECK-NEXT: ret
  
    %conv = fptrunc double %val to float
-  %tmp = tail call i16 @llvm.convert.to.fp16(float %conv)
+  %tmp = tail call i16 @llvm.convert.to.fp16.f32(float %conv)
    %arrayidx = getelementptr inbounds i16* %a, i64 10
    store i16 %tmp, i16* %arrayidx, align 2
    ret void
@@ -231,7 +231,7 @@ define void @store8(i16* nocapture %a, float %val) nounwind {
  ; CHECK-NEXT: stur h0, [x0, #-20]
  ; CHECK-NEXT: ret
  
-  %tmp = tail call i16 @llvm.convert.to.fp16(float %val)
+  %tmp = tail call i16 @llvm.convert.to.fp16.f32(float %val)
    %arrayidx = getelementptr inbounds i16* %a, i64 -10
    store i16 %tmp, i16* %arrayidx, align 2
    ret void
@@ -244,11 +244,11 @@ define void @store9(i16* nocapture %a, double %val) nounwind {
  ; CHECK-NEXT: ret
  
    %conv = fptrunc double %val to float
-  %tmp = tail call i16 @llvm.convert.to.fp16(float %conv)
+  %tmp = tail call i16 @llvm.convert.to.fp16.f32(float %conv)
    %arrayidx = getelementptr inbounds i16* %a, i64 -10
    store i16 %tmp, i16* %arrayidx, align 2
    ret void
  }
  
-declare i16 @llvm.convert.to.fp16(float) nounwind readnone
-declare float @llvm.convert.from.fp16(i16) nounwind readnone
+declare i16 @llvm.convert.to.fp16.f32(float) nounwind readnone
+declare float @llvm.convert.from.fp16.f32(i16) nounwind readnone
diff --git a/test/CodeGen/ARM/fp16.ll b/test/CodeGen/ARM/fp16.ll

index fba794676d49d44f5b04a3afb2fe992bad9e1497..7a99c175751cdf6be345d4af8d02d515da6fd2bc 100644 (file)
--- a/test/CodeGen/ARM/fp16.ll
+++ b/test/CodeGen/ARM/fp16.ll
@@ -13,20 +13,20 @@ define arm_aapcs_vfpcc void @foo() nounwind {
  entry:
    %0 = load i16* @x, align 2
    %1 = load i16* @y, align 2
-  %2 = tail call float @llvm.convert.from.fp16(i16 %0)
+  %2 = tail call float @llvm.convert.from.fp16.f32(i16 %0)
  ; CHECK: __gnu_h2f_ieee
  ; CHECK-FP16: vcvtb.f32.f16
-  %3 = tail call float @llvm.convert.from.fp16(i16 %1)
+  %3 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
  ; CHECK: __gnu_h2f_ieee
  ; CHECK-FP16: vcvtb.f32.f16
    %4 = fadd float %2, %3
-  %5 = tail call i16 @llvm.convert.to.fp16(float %4)
+  %5 = tail call i16 @llvm.convert.to.fp16.f32(float %4)
  ; CHECK: __gnu_f2h_ieee
  ; CHECK-FP16: vcvtb.f16.f32
    store i16 %5, i16* @x, align 2
    ret void
  }
  
-declare float @llvm.convert.from.fp16(i16) nounwind readnone
+declare float @llvm.convert.from.fp16.f32(i16) nounwind readnone
  
-declare i16 @llvm.convert.to.fp16(float) nounwind readnone
+declare i16 @llvm.convert.to.fp16.f32(float) nounwind readnone
diff --git a/test/CodeGen/R600/fp16_to_fp32.ll b/test/CodeGen/R600/fp16_to_fp32.ll

index fa2e379ef7b4a34686de6494be2d3565e1ec303c..dec53e4ac3441279ea0adb536b902fcd3f5ae78a 100644 (file)
--- a/test/CodeGen/R600/fp16_to_fp32.ll
+++ b/test/CodeGen/R600/fp16_to_fp32.ll
@@ -1,6 +1,6 @@
  ; RUN: llc -march=r600 -mcpu=SI -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s
  
-declare i16 @llvm.convert.to.fp16(float) nounwind readnone
+declare i16 @llvm.convert.to.fp16.f32(float) nounwind readnone
  
  ; SI-LABEL: @test_convert_fp16_to_fp32:
  ; SI: BUFFER_LOAD_DWORD [[VAL:v[0-9]+]]
@@ -8,7 +8,7 @@ declare i16 @llvm.convert.to.fp16(float) nounwind readnone
  ; SI: BUFFER_STORE_SHORT [[RESULT]]
  define void @test_convert_fp16_to_fp32(i16 addrspace(1)* noalias %out, float addrspace(1)* noalias %in) nounwind {
    %val = load float addrspace(1)* %in, align 4
-  %cvt = call i16 @llvm.convert.to.fp16(float %val) nounwind readnone
+  %cvt = call i16 @llvm.convert.to.fp16.f32(float %val) nounwind readnone
    store i16 %cvt, i16 addrspace(1)* %out, align 2
    ret void
  }
diff --git a/test/CodeGen/R600/fp32_to_fp16.ll b/test/CodeGen/R600/fp32_to_fp16.ll

index 9997cd3c08f1ef22ce2e0c0b1bd50acf90619edc..3a051f8f67723c2d27dc4828a6e94696bbd3ecf2 100644 (file)
--- a/test/CodeGen/R600/fp32_to_fp16.ll
+++ b/test/CodeGen/R600/fp32_to_fp16.ll
@@ -1,6 +1,6 @@
  ; RUN: llc -march=r600 -mcpu=SI -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s
  
-declare float @llvm.convert.from.fp16(i16) nounwind readnone
+declare float @llvm.convert.from.fp16.f32(i16) nounwind readnone
  
  ; SI-LABEL: @test_convert_fp16_to_fp32:
  ; SI: BUFFER_LOAD_USHORT [[VAL:v[0-9]+]]
@@ -8,7 +8,7 @@ declare float @llvm.convert.from.fp16(i16) nounwind readnone
  ; SI: BUFFER_STORE_DWORD [[RESULT]]
  define void @test_convert_fp16_to_fp32(float addrspace(1)* noalias %out, i16 addrspace(1)* noalias %in) nounwind {
    %val = load i16 addrspace(1)* %in, align 2
-  %cvt = call float @llvm.convert.from.fp16(i16 %val) nounwind readnone
+  %cvt = call float @llvm.convert.from.fp16.f32(i16 %val) nounwind readnone
    store float %cvt, float addrspace(1)* %out, align 4
    ret void
  }
diff --git a/test/CodeGen/X86/cvt16.ll b/test/CodeGen/X86/cvt16.ll

index 951b5c3ed3892e8dc3ae890692e26a0581557485..f3d8049321007cdeba1043071206f5d944af60c2 100644 (file)
--- a/test/CodeGen/X86/cvt16.ll
+++ b/test/CodeGen/X86/cvt16.ll
@@ -21,7 +21,7 @@
  
  
  define void @test1(float %src, i16* %dest) {
-  %1 = tail call i16 @llvm.convert.to.fp16(float %src)
+  %1 = tail call i16 @llvm.convert.to.fp16.f32(float %src)
    store i16 %1, i16* %dest, align 2
    ret void
  }
@@ -34,7 +34,7 @@ define void @test1(float %src, i16* %dest) {
  
  define float @test2(i16* nocapture %src) {
    %1 = load i16* %src, align 2
-  %2 = tail call float @llvm.convert.from.fp16(i16 %1)
+  %2 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
    ret float %2
  }
  ; CHECK-LABEL: test2:
@@ -45,8 +45,8 @@ define float @test2(i16* nocapture %src) {
  
  
  define float @test3(float %src) nounwind uwtable readnone {
-  %1 = tail call i16 @llvm.convert.to.fp16(float %src)
-  %2 = tail call float @llvm.convert.from.fp16(i16 %1)
+  %1 = tail call i16 @llvm.convert.to.fp16.f32(float %src)
+  %2 = tail call float @llvm.convert.from.fp16.f32(i16 %1)
    ret float %2
  }
  
@@ -59,6 +59,6 @@ define float @test3(float %src) nounwind uwtable readnone {
  ; F16C-NEXT: vcvtph2ps
  ; F16C: ret
  
-declare float @llvm.convert.from.fp16(i16) nounwind readnone
-declare i16 @llvm.convert.to.fp16(float) nounwind readnone
+declare float @llvm.convert.from.fp16.f32(i16) nounwind readnone
+declare i16 @llvm.convert.to.fp16.f32(float) nounwind readnone
author	Tim Northover <tnorthover@apple.com>
	Thu, 17 Jul 2014 10:51:23 +0000 (10:51 +0000)
committer	Tim Northover <tnorthover@apple.com>
	Thu, 17 Jul 2014 10:51:23 +0000 (10:51 +0000)
docs/LangRef.rst		patch \| blob \| history
include/llvm/CodeGen/ISDOpcodes.h		patch \| blob \| history
include/llvm/IR/Intrinsics.td		patch \| blob \| history
include/llvm/Target/TargetSelectionDAG.td		patch \| blob \| history
lib/CodeGen/SelectionDAG/LegalizeDAG.cpp		patch \| blob \| history
lib/CodeGen/SelectionDAG/LegalizeFloatTypes.cpp		patch \| blob \| history
lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp		patch \| blob \| history
lib/CodeGen/SelectionDAG/LegalizeTypes.h		patch \| blob \| history
lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp		patch \| blob \| history
lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp		patch \| blob \| history
lib/Target/AArch64/AArch64InstrInfo.td		patch \| blob \| history
lib/Target/ARM/ARMISelLowering.cpp		patch \| blob \| history
lib/Target/ARM/ARMInstrVFP.td		patch \| blob \| history
lib/Target/NVPTX/NVPTXIntrinsics.td		patch \| blob \| history
lib/Target/R600/SIInstructions.td		patch \| blob \| history
lib/Target/X86/X86ISelLowering.cpp		patch \| blob \| history
lib/Target/X86/X86InstrSSE.td		patch \| blob \| history
test/CodeGen/AArch64/arm64-vcvt_f.ll		patch \| blob \| history
test/CodeGen/AArch64/f16-convert.ll		patch \| blob \| history
test/CodeGen/ARM/fp16.ll		patch \| blob \| history
test/CodeGen/R600/fp16_to_fp32.ll		patch \| blob \| history
test/CodeGen/R600/fp32_to_fp16.ll		patch \| blob \| history
test/CodeGen/X86/cvt16.ll		patch \| blob \| history