Merge pull request #378 from JuliaDiff/ox/tansym

oxinabox · web-flow · commit 24318b0321cc · 2021-02-17T22:26:33.000Z
symmetric.jl tests: use automatically generated tangents (test_frule/test_rrule)
diff --git a/test/rulesets/LinearAlgebra/symmetric.jl b/test/rulesets/LinearAlgebra/symmetric.jl
@@ -4,72 +4,65 @@
         T in (Float64, ComplexF64),
         uplo in (:U, :L)
 
-        N = 3
         @testset "frule" begin
-            x = randn(T, N, N)
-            Δx = randn(T, N, N)
-            # can't use frule_test here because it doesn't yet ignore nothing tangents
-            Ω = SymHerm(x, uplo)
-            Ω_ad, ∂Ω_ad = frule((Zero(), Δx, Zero()), SymHerm, x, uplo)
-            @test Ω_ad == Ω
-            ∂Ω_fd = jvp(_fdm, z -> SymHerm(z, uplo), (x, Δx))
-            @test ∂Ω_ad ≈ ∂Ω_fd
+            test_frule(SymHerm, rand(T, 3, 3), uplo ⊢ nothing)
         end
         @testset "rrule" begin
             # on old versions of julia this combination doesn't infer but we don't care as
             # it infers fine on modern versions.
             check_inferred = !(VERSION < v"1.5" && T <: ComplexF64 && SymHerm <: Hermitian)
 
-            x = randn(T, N, N)
-            ∂x = randn(T, N, N)
-            ΔΩ = randn(T, N, N)
             @testset "back(::$MT)" for MT in (Matrix, LowerTriangular, UpperTriangular)
-                rrule_test(
-                    SymHerm, MT(ΔΩ), (x, ∂x), (uplo, nothing);
+                x = randn(T, 3, 3)
+                ΔΩ = MT(randn(T, 3, 3))
+                test_rrule(
+                    SymHerm, x, uplo ⊢ nothing;
+                    output_tangent = ΔΩ,
                     # type stability here critically relies on uplo being constant propagated,
                     # so we need to test this more carefully below
                     check_inferred=false,
                 )
                 if check_inferred
-                    @inferred (function (SymHerm, x, ΔΩ, ::Val{uplo}) where {uplo}
+                    @inferred (function (SymHerm, x, ΔΩ, ::Val)
                         return rrule(SymHerm, x, uplo)[2](ΔΩ)
-                    end)(SymHerm, x, MT(ΔΩ), Val(uplo))
+                    end)(SymHerm, x, ΔΩ, Val(uplo))
                 end
             end
             @testset "back(::Diagonal)" begin
-                rrule_test(
-                    SymHerm, Diagonal(ΔΩ), (x, Diagonal(∂x)), (uplo, nothing);
+                x = randn(T, 3, 3)
+                ΔΩ = Diagonal(randn(T, 3, 3))
+                test_rrule(
+                    SymHerm, x ⊢ Diagonal(randn(T, 3)), uplo ⊢ nothing;
                     check_inferred=false,
+                    output_tangent = ΔΩ,
                 )
                 if check_inferred
-                    @inferred (function (SymHerm, x, ΔΩ, ::Val{uplo}) where {uplo}
+                    @inferred (function (SymHerm, x, ΔΩ, ::Val)
                         return rrule(SymHerm, x, uplo)[2](ΔΩ)
-                    end)(SymHerm, x, Diagonal(ΔΩ), Val(uplo))
+                    end)(SymHerm, x, ΔΩ, Val(uplo))
                 end
             end
         end
     end
+    # constructing a `Matrix`/`Array` from `SymHerm`
     @testset "$(f)(::$(SymHerm){$T}) with uplo=:$uplo" for f in (Matrix, Array),
         SymHerm in (Symmetric, Hermitian),
         T in (Float64, ComplexF64),
         uplo in (:U, :L)
 
-        N = 3
-        x = SymHerm(randn(T, N, N), uplo)
-        Δx = randn(T, N, N)
-        ∂x = SymHerm(randn(T, N, N), uplo)
-        ΔΩ = f(SymHerm(randn(T, N, N), uplo))
-        frule_test(f, (x, Δx))
-        frule_test(f, (x, SymHerm(Δx, uplo)))
-        rrule_test(f, ΔΩ, (x, ∂x))
+        x = SymHerm(randn(T, 3, 3), uplo)
+        test_rrule(f, x)
+
+        # explicit (not auto-generated) tangents, to test both Matrix and SymHerm tangents
+        test_frule(f, x ⊢ randn(T, 3, 3))
+        test_frule(f, x ⊢ SymHerm(randn(T, 3, 3), uplo))
     end
 
     # symmetric/hermitian eigendecomposition follows the sign convention
     # v = v * sign(real(vₖ)) * sign(vₖ)', where vₖ is the first or last coordinate
     # in the eigenvector. This is unstable for finite differences, but using the convention
     # v = v * sign(vₖ)' seems to be more stable, the (co)tangents are related as
     # ∂v_ad = sign(real(vₖ)) * ∂v_fd
-
     function _eigvecs_stabilize_mat(vectors, uplo)
         Ui = Symbol(uplo) === :U ? @view(vectors[end, :]) : @view(vectors[1, :])
         return Diagonal(conj.(sign.(Ui)))