Merge pull request #3655 from sejongoh/fix_u64_to_f64_cast

sejongoh · sejongoh · commit 1cd5d1b11229 · 2016-03-18T19:23:15.000-07:00
Fix inconsistent uint64-to-double cast
diff --git a/src/jit/codegenxarch.cpp b/src/jit/codegenxarch.cpp
@@ -7502,6 +7502,10 @@ CodeGen::genIntToFloatCast(GenTreePtr treeNode)
     // result if sign-bit of srcType is set.
     if (srcType == TYP_ULONG)
     {
+        // The instruction sequence below is less accurate than what clang
+        // and gcc generate. However, we keep the current sequence for backward compatibility.
+        // If we change the instructions below, FloatingPointUtils::convertUInt64ToDouble
+        // should also be updated for consistent conversion results.
         assert(dstType == TYP_DOUBLE);
         assert(!op1->isContained());
 
diff --git a/src/jit/gentree.cpp b/src/jit/gentree.cpp
@@ -9954,7 +9954,7 @@ GenTreePtr                  Compiler::gtFoldExprConst(GenTreePtr tree)
                 case TYP_DOUBLE:
                     if ((tree->gtFlags & GTF_UNSIGNED) && lval1 < 0)
                     {
-                        d1 = (double) (unsigned __int64) lval1;
+                        d1 = FloatingPointUtils::convertUInt64ToDouble((unsigned __int64)lval1);
                     }
                     else
                     {
@@ -10074,29 +10074,8 @@ GenTreePtr                  Compiler::gtFoldExprConst(GenTreePtr tree)
                     lval1 = INT64(d1);      goto CNS_LONG;
 
                 case TYP_ULONG:
-                    if (d1 >= 0.0)
-                    {
-                        // Work around a C++ issue where it doesn't properly convert large positive doubles
-                        const double two63  = 2147483648.0 * 4294967296.0;
-                        if (d1 < two63) {
-                            lval1 = UINT64(d1);
-                        }
-                        else {        
-                            // subtract 0x8000000000000000, do the convert then add it back again
-                            lval1 = INT64(d1 - two63) + I64(0x8000000000000000);
-                        }
-                        goto CNS_LONG;
-                    }
-                    
-                    // This double cast to account for an ECMA spec hole.
-                    // When converting from a double to an unsigned the ECMA
-                    // spec states that a conforming implementation should 
-                    // "truncate to zero." However that doesn't make much sense
-                    // when the double in question is negative and the target
-                    // is unsigned. gcc converts a negative double to zero when
-                    // cast to an unsigned. To make gcc conform to MSVC behavior
-                    // this cast is necessary.
-                    lval1 = UINT64(INT64(d1));     goto CNS_LONG;
+                    lval1 = FloatingPointUtils::convertDoubleToUInt64(d1);
+                    goto CNS_LONG;
 
                 case TYP_FLOAT:
                     d1 = forceCastToFloat(d1);  
diff --git a/src/jit/utils.cpp b/src/jit/utils.cpp
@@ -1544,3 +1544,66 @@ unsigned            CountDigits(unsigned num, unsigned base /* = 10 */)
 }
 
 #endif // DEBUG
+
+
+double FloatingPointUtils::convertUInt64ToDouble(unsigned __int64 uIntVal) {
+    // Converts uIntVal to double. Only values with the top bit set need special handling.
+    __int64 s64 = uIntVal;
+    double d;
+    if (s64 < 0) {
+#if defined(_TARGET_XARCH_)
+        // RyuJIT codegen and clang (or gcc) may produce different results for casting uint64 to
+        // double, and the clang result is more accurate. For example,
+        //    1) (double)0x84595161401484A0UL --> 43e08b2a2c280290  (RyuJIT codegen or VC++)
+        //    2) (double)0x84595161401484A0UL --> 43e08b2a2c280291  (clang or gcc)
+        // If constant folding simply cast (double)uint64_val and the JIT were compiled by clang,
+        // the result would depend on whether the cast was folded or emitted as instructions.
+        // The current solution is to force the same math as the codegen does, so that casting
+        // result is always consistent.
+        // d = (double)(int64_t)uint64 + 0x1p64. 2^64 is spelled as a product of exact double
+        // constants instead of reinterpreting integer bits through a double*, which is UB.
+        const double two64 = 4294967296.0 * 4294967296.0;
+        d = (double)s64 + two64;
+#else
+        d = (double)uIntVal;
+#endif
+    }
+    else
+    {
+        d = (double)uIntVal;
+    }
+    return d;
+}
+
+float FloatingPointUtils::convertUInt64ToFloat(unsigned __int64 u64) {
+    // Convert via convertUInt64ToDouble, then narrow the resulting double to float.
+    return (float)convertUInt64ToDouble(u64);
+}
+
+unsigned __int64 FloatingPointUtils::convertDoubleToUInt64(double d) {
+    // Converts d to an unsigned 64-bit integer. The first test is written as !(d >= 0.0)
+    // rather than d < 0.0 so that every input failing d >= 0.0 (a NaN included, since
+    // comparisons against NaN are false) takes the signed-cast path.
+    if (!(d >= 0.0))
+    {
+        // This double cast is to account for an ECMA spec hole.
+        // When converting from a double to an unsigned the ECMA
+        // spec states that a conforming implementation should
+        // "truncate to zero." However that doesn't make much sense
+        // when the double in question is negative and the target
+        // is unsigned. gcc converts a negative double to zero when
+        // cast to an unsigned. To make gcc conform to MSVC behavior
+        // this cast is necessary.
+        return UINT64(INT64(d));
+    }
+
+    // Work around a C++ issue where it doesn't properly convert large positive doubles
+    const double two63 = 2147483648.0 * 4294967296.0;
+    if (d < two63)
+    {
+        return UINT64(d);
+    }
+
+    // subtract 0x8000000000000000, do the convert then add it back again
+    return INT64(d - two63) + I64(0x8000000000000000);
+}
diff --git a/src/jit/utils.h b/src/jit/utils.h
@@ -510,4 +510,17 @@ struct ListNode
     }
 };
 
+/*****************************************************************************
+* Floating point utility class 
+*/
+class FloatingPointUtils {
+public:
+    // uint64 -> double; on xarch, top-bit-set values use the same math as the JIT's cast codegen.
+    static double convertUInt64ToDouble(unsigned __int64 u64);
+    // uint64 -> float, obtained by narrowing the result of convertUInt64ToDouble.
+    static float convertUInt64ToFloat(unsigned __int64 u64);
+    // double -> uint64; negative inputs are converted through a signed 64-bit cast first.
+    static unsigned __int64 convertDoubleToUInt64(double d);
+};
+
 #endif // _UTILS_H_
diff --git a/src/jit/valuenum.cpp b/src/jit/valuenum.cpp
@@ -1906,13 +1906,13 @@ ValueNum ValueNumStore::EvalCastForConstantArgs(var_types typ, VNFunc func, Valu
                 case TYP_FLOAT:
                     assert(typ == TYP_FLOAT);
                      if (srcIsUnsigned)
-                         return VNForFloatCon(float(UINT64(arg0Val)));
+                         return VNForFloatCon(FloatingPointUtils::convertUInt64ToFloat(UINT64(arg0Val)));
                      else
                          return VNForFloatCon(float(arg0Val));
                 case TYP_DOUBLE:
                     assert(typ == TYP_DOUBLE);
                      if (srcIsUnsigned)
-                         return VNForDoubleCon(double(UINT64(arg0Val)));
+                         return VNForDoubleCon(FloatingPointUtils::convertUInt64ToDouble(UINT64(arg0Val)));
                      else
                          return VNForDoubleCon(double(arg0Val));
                 default:
diff --git a/tests/src/JIT/Regression/JitBlue/GitHub_3449/GitHub_3449.cs b/tests/src/JIT/Regression/JitBlue/GitHub_3449/GitHub_3449.cs
@@ -0,0 +1,42 @@
+// Licensed to the .NET Foundation under one or more agreements.
+// The .NET Foundation licenses this file to you under the MIT license.
+// See the LICENSE file in the project root for more information
+
+using System;
+
+public class Program
+{
+    // RyuJIT codegen and clang (or gcc) may produce different results for casting uint64 to
+    // double, and the clang result is more accurate. For example,
+    //    1) (double)0x84595161401484A0UL --> 43e08b2a2c280290  (RyuJIT codegen or VC++)
+    //    2) (double)0x84595161401484A0UL --> 43e08b2a2c280291  (clang or gcc)
+    // Constant folding in RyuJIT simply does (double)0x84595161401484A0UL in its C++ implementation.
+    // If it is compiled by clang, the example unsigned value and cast tree node are folded into
+    // 43e08b2a2c280291, which is different from what the codegen produces. To fix this inconsistency,
+    // the constant folding is forced to have the same behavior as the codegen, and the result
+    // must always be 43e08b2a2c280290 (this test expects 43e08b2a2c280291 when it detects ARM/ARM64).
+    public static int Main(string[] args)
+    {
+        // Check if the test is being executed on ARMARCH. PROCESSOR_ARCHITECTURE holds a machine
+        // identifier rather than user-facing text, so it is compared ordinally, not by culture.
+        string processorArchEnvVar = Environment.GetEnvironmentVariable("PROCESSOR_ARCHITECTURE");
+        bool isProcessorArmArch = (processorArchEnvVar != null)
+            && (processorArchEnvVar.Equals("ARM", StringComparison.OrdinalIgnoreCase)
+                || processorArchEnvVar.Equals("ARM64", StringComparison.OrdinalIgnoreCase));
+
+        // Cast the example value and capture the raw bits of the resulting double.
+        ulong u64 = 0x84595161401484A0UL;
+        double f64 = (double)u64;
+        long h64 = BitConverter.DoubleToInt64Bits(f64);
+
+        // When ARM is detected, the value labelled "clang or gcc" above is expected instead.
+        long expected_h64 = isProcessorArmArch ? 0x43e08b2a2c280291L : 0x43e08b2a2c280290L;
+        if (h64 != expected_h64)
+        {
+            Console.WriteLine(String.Format("Expected: 0x{0:x}\nActual: 0x{1:x}", expected_h64, h64));
+            return -1;
+        }
+
+        return 100;
+    }
+}
diff --git a/tests/src/JIT/Regression/JitBlue/GitHub_3449/GitHub_3449.csproj b/tests/src/JIT/Regression/JitBlue/GitHub_3449/GitHub_3449.csproj
@@ -0,0 +1,50 @@
+<?xml version="1.0" encoding="utf-8"?>
+<Project ToolsVersion="12.0" DefaultTargets="Build" xmlns="http://schemas.microsoft.com/developer/msbuild/2003">
+  <Import Project="$([MSBuild]::GetDirectoryNameOfFileAbove($(MSBuildThisFileDirectory), dir.props))\dir.props" />
+  <PropertyGroup>
+    <Configuration Condition=" '$(Configuration)' == '' ">Debug</Configuration>
+    <Platform Condition=" '$(Platform)' == '' ">AnyCPU</Platform>
+    <AssemblyName>$(MSBuildProjectName)</AssemblyName>
+    <SchemaVersion>2.0</SchemaVersion>
+    <ProjectGuid>{95DFC527-4DC1-495E-97D7-E94EE1F7140D}</ProjectGuid>
+    <OutputType>Exe</OutputType>
+    <AppDesignerFolder>Properties</AppDesignerFolder>
+    <FileAlignment>512</FileAlignment>
+    <ProjectTypeGuids>{786C830F-07A1-408B-BD7F-6EE04809D6DB};{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}</ProjectTypeGuids>
+    <ReferencePath>$(ProgramFiles)\Common Files\microsoft shared\VSTT\11.0\UITestExtensionPackages</ReferencePath>
+    <SolutionDir Condition="$(SolutionDir) == '' Or $(SolutionDir) == '*Undefined*'">..\..\</SolutionDir>
+
+    <NuGetPackageImportStamp>7a9bfb7d</NuGetPackageImportStamp>
+  </PropertyGroup>
+  <!-- Default configurations to help VS understand the configurations -->
+  <PropertyGroup Condition=" '$(Configuration)|$(Platform)' == 'Debug|AnyCPU' ">
+  </PropertyGroup>
+  <PropertyGroup Condition=" '$(Configuration)|$(Platform)' == 'Release|AnyCPU' ">
+  </PropertyGroup>
+  <ItemGroup>
+    <CodeAnalysisDependentAssemblyPaths Condition=" '$(VS100COMNTOOLS)' != '' " Include="$(VS100COMNTOOLS)..\IDE\PrivateAssemblies">
+      <Visible>False</Visible>
+    </CodeAnalysisDependentAssemblyPaths>
+  </ItemGroup>
+  <PropertyGroup>
+    <DebugType></DebugType>
+    <Optimize>True</Optimize>
+  </PropertyGroup>
+  <ItemGroup>
+    <Compile Include="$(MSBuildProjectName).cs" />
+  </ItemGroup>
+  <ItemGroup>
+    <None Include="$(JitPackagesConfigFileDirectory)minimal\project.json" />
+    <None Include="app.config" />
+  </ItemGroup>
+  <ItemGroup>
+    <Service Include="{82A7F48D-3B50-4B1E-B82E-3ADA8210C358}" />
+  </ItemGroup>
+  <PropertyGroup>
+    <ProjectJson>$(JitPackagesConfigFileDirectory)minimal\project.json</ProjectJson>
+    <ProjectLockJson>$(JitPackagesConfigFileDirectory)minimal\project.lock.json</ProjectLockJson>
+  </PropertyGroup>
+  <Import Project="$([MSBuild]::GetDirectoryNameOfFileAbove($(MSBuildThisFileDirectory), dir.targets))\dir.targets" />
+  <PropertyGroup Condition=" '$(MsBuildProjectDirOverride)' != '' ">
+  </PropertyGroup> 
+</Project>
diff --git a/tests/src/JIT/Regression/JitBlue/GitHub_3449/app.config b/tests/src/JIT/Regression/JitBlue/GitHub_3449/app.config
@@ -0,0 +1,27 @@
+﻿<?xml version="1.0" encoding="utf-8"?>
+<configuration>
+  <runtime>
+    <assemblyBinding xmlns="urn:schemas-microsoft-com:asm.v1">
+      <dependentAssembly>
+        <assemblyIdentity name="System.Runtime" publicKeyToken="b03f5f7f11d50a3a" culture="neutral" />
+        <bindingRedirect oldVersion="0.0.0.0-4.0.20.0" newVersion="4.0.20.0" />
+      </dependentAssembly>
+      <dependentAssembly>
+        <assemblyIdentity name="System.Text.Encoding" publicKeyToken="b03f5f7f11d50a3a" culture="neutral" />
+        <bindingRedirect oldVersion="0.0.0.0-4.0.10.0" newVersion="4.0.10.0" />
+      </dependentAssembly>
+      <dependentAssembly>
+        <assemblyIdentity name="System.Threading.Tasks" publicKeyToken="b03f5f7f11d50a3a" culture="neutral" />
+        <bindingRedirect oldVersion="0.0.0.0-4.0.10.0" newVersion="4.0.10.0" />
+      </dependentAssembly>
+      <dependentAssembly>
+        <assemblyIdentity name="System.IO" publicKeyToken="b03f5f7f11d50a3a" culture="neutral" />
+        <bindingRedirect oldVersion="0.0.0.0-4.0.10.0" newVersion="4.0.10.0" />
+      </dependentAssembly>
+      <dependentAssembly>
+        <assemblyIdentity name="System.Reflection" publicKeyToken="b03f5f7f11d50a3a" culture="neutral" />
+        <bindingRedirect oldVersion="0.0.0.0-4.0.10.0" newVersion="4.0.10.0" />
+      </dependentAssembly>
+    </assemblyBinding>
+  </runtime>
+</configuration>