JuliaMath
diff --git a/‎src/Bessels.jl
Lines changed: 1 addition & 0 deletions b/‎src/Bessels.jl
Lines changed: 1 addition & 0 deletions
diff --git a/‎src/Float128/besselj.jl
Lines changed: 1 addition & 0 deletions b/‎src/Float128/besselj.jl
Lines changed: 1 addition & 0 deletions
diff --git a/‎src/besselj.jl
Lines changed: 69 additions & 83 deletions b/‎src/besselj.jl
Lines changed: 69 additions & 83 deletions
diff --git a/‎src/bessely.jl
Lines changed: 67 additions & 63 deletions b/‎src/bessely.jl
Lines changed: 67 additions & 63 deletions
@@ -36,6 +36,7 @@ include("Float128/constants.jl")
 include("math_constants.jl")
 include("U_polynomials.jl")
 include("recurrence.jl")
+include("misc.jl")
 #include("hankel.jl")
 
 end
@@ -67,3 +67,4 @@ function besselj0(x::BigFloat)
         return z
     end
 end
+
@@ -1,42 +1,77 @@
-#=
-Cephes Math Library Release 2.8:  June, 2000
-Copyright 1984, 1987, 2000 by Stephen L. Moshier
-https://github.com/jeremybarnes/cephes/blob/master/bessel/j0.c
-https://github.com/jeremybarnes/cephes/blob/master/bessel/j1.c
-=#
-function besselj0(x::Float64)
-    T = Float64
+#    Bessel functions of the first kind of order zero and one
+#                       besselj0, besselj1
+#
+#    Calculation of besselj0 is done in three branches using polynomial approximations
+#
+#    Branch 1: x <= 5.0
+#              besselj0 = (x^2 - r1^2)*(x^2 - r2^2)*P3(x^2) / Q8(x^2)
+#    where r1 and r2 are zeros of J0
+#    and P3 and Q8 are polynomials of degree 3 and 8, respectively.
+#    Polynomial coefficients are from [1] which is based on [2]
+#    For tiny arguments the power series expansion is used.
+#
+#    Branch 2: 5.0 < x < 75.0
+#              besselj0 = sqrt(2/(pi*x))*(cos(x - pi/4)*R7(x) - sin(x - pi/4)*R8(x))
+#    Hankel's asymptotic expansion is used
+#    where R7 and R8 are rational functions (Pn(x)/Qn(x)) of degree 7 and 8 respectively
+#    See section 4 of [3] for more details and [1] for coefficients of polynomials
+# 
+#   Branch 3: x >= 75.0
+#              besselj0 = sqrt(2/(pi*x))*beta(x)*cos(x - pi/4 - alpha(x))
+#   See modified expansions given in [3]. Exact coefficients are used
+#
+#   Calculation of besselj1 is done in a similar way as besselj0.
+#   See [3] for details on similarities.
+# 
+# [1] https://github.com/deepmind/torch-cephes
+# [2] Cephes Math Library Release 2.8:  June, 2000 by Stephen L. Moshier
+# [3] Harrison, John. "Fast and accurate Bessel function computation." 
+#     2009 19th IEEE Symposium on Computer Arithmetic. IEEE, 2009.
+#
+function besselj0(x::T) where T
     x = abs(x)
-    iszero(x) && return one(x)
     isinf(x) && return zero(x)
 
     if x <= 5
         z = x * x
         if x < 1.0e-5
             return 1.0 - z / 4.0
         end
-
-        DR1 = 5.78318596294678452118E0
-        DR2 = 3.04712623436620863991E1
-
+        DR1 = 5.78318596294678452118e0
+        DR2 = 3.04712623436620863991e1
         p = (z - DR1) * (z - DR2)
         p = p * evalpoly(z, RP_j0(T)) / evalpoly(z, RQ_j0(T))
         return p
-    else
+    elseif x < 75.0
         w = 5.0 / x
         q = 25.0 / (x * x)
 
         p = evalpoly(q, PP_j0(T)) / evalpoly(q, PQ_j0(T))
         q = evalpoly(q, QP_j0(T)) / evalpoly(q, QQ_j0(T))
         xn = x - PIO4(T)
-        p = p * cos(xn) - w * q * sin(xn)
+        sc = sincos(xn)
+        p = p * sc[2] - w * q * sc[1]
         return p * SQ2OPI(T) / sqrt(x)
+    else
+        xinv = inv(x)
+        x2 = xinv*xinv
+
+        p = (one(T), -1/16, 53/512, -4447/8192, 5066403/524288)
+        p = evalpoly(x2, p)
+        a = SQ2OPI(T) * sqrt(xinv) * p
+
+        q = (-1/8, 25/384, -1073/5120, 375733/229376, -55384775/2359296)
+        xn = muladd(xinv, evalpoly(x2, q), - PIO4(T))
+
+        # the following computes b = cos(x + xn) more accurately
+        # see src/misc.jl
+        b = cos_sum(x, xn)
+        return a * b
     end
 end
 function besselj0(x::Float32)
     T = Float32
     x = abs(x)
-    iszero(x) && return one(x)
     isinf(x) && return zero(x)
 
     if x <= 2.0f0
@@ -61,28 +96,42 @@ end
 function besselj1(x::Float64)
     T = Float64
     x = abs(x)
-    iszero(x) && return zero(x)
     isinf(x) && return zero(x)
 
     if x <= 5.0
         z = x * x
         w = evalpoly(z, RP_j1(T)) / evalpoly(z, RQ_j1(T))
         w = w * x * (z - 1.46819706421238932572e1) * (z - 4.92184563216946036703e1)
         return w
-    else
+    elseif x < 75.0
         w = 5.0 / x
         z = w * w
         p = evalpoly(z, PP_j1(T)) / evalpoly(z, PQ_j1(T))
         q = evalpoly(z, QP_j1(T)) / evalpoly(z, QQ_j1(T))
         xn = x - THPIO4(T)
-        p = p * cos(xn) - w * q * sin(xn)
+        sc = sincos(xn)
+        p = p * sc[2] - w * q * sc[1]
         return p * SQ2OPI(T) / sqrt(x)
+    else
+        xinv = inv(x)
+        x2 = xinv*xinv
+
+        p = (one(T), 3/16, -99/512, 6597/8192, -4057965/524288)
+        p = evalpoly(x2, p)
+        a = SQ2OPI(T) * sqrt(xinv) * p
+
+        q = (3/8, -21/128, 1899/5120, -543483/229376, 8027901/262144)
+        xn = muladd(xinv, evalpoly(x2, q), - 3 * PIO4(T))
+
+        # the following computes b = cos(x + xn) more accurately
+        # see src/misc.jl
+        b = cos_sum(x, xn)
+        return a * b
     end
 end
 
 function besselj1(x::Float32)
     x = abs(x)
-    iszero(x) && return zero(x)
     isinf(x) && return zero(x)
 
     if x <= 2.0f0
@@ -100,66 +149,3 @@ function besselj1(x::Float32)
         return p
     end
 end
-
-function besselj(n::Int, x::Float64)
-    if n < 0
-        n = -n
-        if (n & 1) == 0
-            sign = 1
-        else
-            sign = -1
-        end
-    else
-        sign = 1
-    end
-
-    if x < zero(x)
-        if (n & 1)
-            sign = -sign
-            x = -x
-        end
-    end
-
-    if n == 0
-        return sign * besselj0(x)
-    elseif n == 1
-        return sign * besselj1(x)
-    elseif n == 2
-        return sign * (2.0 * besselj1(x) / x  -  besselj0(x))
-    end
-
-    #if x < MACHEP
-     #   return 0.0
-    #end
-
-    k = 40 # or 53
-    pk = 2 * (n + k)
-    ans = pk
-    xk = x * x
-
-    for _ in 1:k
-        pk -= 2.0
-        ans = pk - (xk / ans)
-    end
-
-    ans = x / ans
-
-    pk = 1.0
-    pkm1 = inv(ans)
-    k = n - 1
-    r = 2 * k
-
-    for _ in 1:k
-        pkm2 = (pkm1 * r  -  pk * x) / x
-	    pk = pkm1
-	    pkm1 = pkm2
-	    r -= 2.0
-    end
-    if abs(pk) > abs(pkm1)
-        ans = besselj1(x) / pk
-    else
-        ans = besselj0(x) / pkm1
-    end
-
-    return sign * ans
-end
@@ -1,9 +1,33 @@
-#=
-Cephes Math Library Release 2.8:  June, 2000
-Copyright 1984, 1987, 2000 by Stephen L. Moshier
-https://github.com/jeremybarnes/cephes/blob/master/bessel/j0.c
-https://github.com/jeremybarnes/cephes/blob/master/bessel/j1.c
-=#
+#    Bessel functions of the second kind of order zero and one
+#                       bessely0, bessely1
+#
+#    Calculation of bessely0 is done in three branches using polynomial approximations
+#
+#    Branch 1: x <= 5.0
+#              bessely0 = R(x^2) + 2*log(x)*besselj0(x) / pi
+#    where R(x^2) is a rational function of x^2, i.e. the ratio of the
+#    polynomials with coefficients YP_y0 and YQ_y0.
+#    Polynomial coefficients are from [1] which is based on [2].
+#    For tiny arguments the power series expansion is used.
+#
+#    Branch 2: 5.0 < x < 75.0
+#              bessely0 = sqrt(2/(pi*x))*(sin(x - pi/4)*R7(x) + cos(x - pi/4)*R8(x))
+#    Hankel's asymptotic expansion is used
+#    where R7 and R8 are rational functions (Pn(x)/Qn(x)) of degree 7 and 8 respectively
+#    See section 4 of [3] for more details and [1] for coefficients of polynomials
+# 
+#   Branch 3: x >= 75.0
+#              bessely0 = sqrt(2/(pi*x))*beta(x)*sin(x - pi/4 - alpha(x))
+#   See modified expansions given in [3]. Exact coefficients are used.
+#
+#   Calculation of bessely1 is done in a similar way as bessely0.
+#   See [3] for details on similarities.
+# 
+# [1] https://github.com/deepmind/torch-cephes
+# [2] Cephes Math Library Release 2.8:  June, 2000 by Stephen L. Moshier
+# [3] Harrison, John. "Fast and accurate Bessel function computation." 
+#     2009 19th IEEE Symposium on Computer Arithmetic. IEEE, 2009.
+#
 function bessely0(x::T) where T <: Union{Float32, Float64}
     if x <= zero(x)
         if iszero(x)
@@ -23,14 +47,30 @@ function _bessely0_compute(x::Float64)
         w = evalpoly(z, YP_y0(T)) / evalpoly(z, YQ_y0(T))
         w += TWOOPI(T) * log(x) * besselj0(x)
         return w
-    else
+    elseif x < 75.0
         w = T(5) / x
         z = w*w
         p = evalpoly(z, PP_y0(T)) / evalpoly(z, PQ_y0(T))
         q = evalpoly(z, QP_y0(T)) / evalpoly(z, QQ_y0(T))
         xn = x - PIO4(T)
-        p = p * sin(xn) + w * q * cos(xn);
+        sc = sincos(xn)
+        p = p * sc[1] + w * q * sc[2]
         return p * SQ2OPI(T) / sqrt(x)
+    else
+        xinv = inv(x)
+        x2 = xinv*xinv
+
+        p = (one(T), -1/16, 53/512, -4447/8192, 5066403/524288)
+        p = evalpoly(x2, p)
+        a = SQ2OPI(T) * sqrt(xinv) * p
+
+        q = (-1/8, 25/384, -1073/5120, 375733/229376, -55384775/2359296)
+        xn = muladd(xinv, evalpoly(x2, q), - PIO4(T))
+
+        # the following computes b = sin(x + xn) more accurately
+        # see src/misc.jl
+        b = sin_sum(x, xn)
+        return a * b
     end
 end
 function _bessely0_compute(x::Float32)
@@ -71,22 +111,38 @@ function _bessely1_compute(x::Float64)
         w = x * (evalpoly(z, YP_y1(T)) / evalpoly(z, YQ_y1(T)))
         w += TWOOPI(T) * (besselj1(x) * log(x) - inv(x))
         return w
-    else
+    elseif x < 75.0
         w = T(5) / x
         z = w * w
         p = evalpoly(z, PP_j1(T)) / evalpoly(z, PQ_j1(T))
         q = evalpoly(z, QP_j1(T)) / evalpoly(z, QQ_j1(T))
         xn = x - THPIO4(T)
-        p = p * sin(xn) + w * q * cos(xn)
+        sc = sincos(xn)
+        p = p * sc[1] + w * q * sc[2]
         return p * SQ2OPI(T) / sqrt(x)
+    else
+        xinv = inv(x)
+        x2 = xinv*xinv
+
+        p = (one(T), 3/16, -99/512, 6597/8192, -4057965/524288)
+        p = evalpoly(x2, p)
+        a = SQ2OPI(T) * sqrt(xinv) * p
+
+        q = (3/8, -21/128, 1899/5120, -543483/229376, 8027901/262144)
+        xn = muladd(xinv, evalpoly(x2, q), - 3 * PIO4(T))
+
+        # the following computes b = sin(x + xn) more accurately
+        # see src/misc.jl
+        b = sin_sum(x, xn)
+        return a * b
     end
 end
 
 function _bessely1_compute(x::Float32)
     T = Float32
     if x <= 2.0f0
         z = x * x
-        YO1 =  4.66539330185668857532f0
+        YO1 = 4.66539330185668857532f0
         w = (z - YO1) * x * evalpoly(z, YP32)
         w += TWOOPI(Float32) * (besselj1(x) * log(x) - inv(x))
         return w
@@ -100,55 +156,3 @@ function _bessely1_compute(x::Float32)
         return p
     end
 end
-
-#	Bessel function of second kind, order zero
-#
-#	Bessel function of second kind, order one
-#=
-Ported to Julia from:
-Cephes Math Library Release 2.2:  June, 1992
-Copyright 1984, 1987, 1992 by Stephen L. Moshier
-Direct inquiries to 30 Frost Street, Cambridge, MA 02140
-https://github.com/jeremybarnes/cephes/blob/master/single/j0f.c
-https://github.com/jeremybarnes/cephes/blob/master/single/j1f.c
-=#
-
-#=
-function bessely(n::Int, x)
-    if n < 0
-        n = -n
-        if n & 1 == 0
-            sign = 1
-        else sign = -1
-        end
-    else
-        sign = 1
-    end
-
-    if n == 0
-        return sign * bessely0(x)
-    elseif n == 1
-        return sign * bessely1(x)
-    end
-
-    if x <= 0.0
-        return NaN
-    end
-
-    anm2 = bessely0(x)
-    anm1 = bessely1(x)
-    an = zero(x)
-
-    k = 1
-    r = 2 * k
-
-    for _ in 1:n
-        an = r * anm1 / x - anm2
-        anm2 = anm1
-        anm1 = an
-        r += 2.0
-    end
-
-    return sign * an
-end
-=#
-Original file line number
+Diff line change
         return z
     end
 end
++