# This file contains tests adapted from ForwardDiff.jl, many of them using DiffTests.jl
# Organised here file-by-file in alphabetical order!

#####
##### setup
#####

using Test, LinearAlgebra
using ForwardDiff, DiffTests
using Diffractor, ChainRulesCore

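# Derivative helpers for scalar inputs: `fwd_derivative` wraps Diffractor's forward-mode
# PrimeDerivativeFwd, while `rev_derivative` wraps reverse-mode PrimeDerivativeBack, taking
# one pullback per output element when f returns an array (simple, not efficient).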
fwd_derivative(f, x::Number) = Diffractor.PrimeDerivativeFwd(f)(x) |> unthunk
function rev_derivative(f, x::Number)
    y = f(x)
    if y isa Number
        Diffractor.PrimeDerivativeBack(f)(x)
    elseif y isa AbstractArray
        map(CartesianIndices(y)) do I
            Diffractor.PrimeDerivativeBack(x -> f(x)[I])(x) |> unthunk
        end
    else
        error("can't handle f(x)::$(typeof(y))")
    end
end

@test ForwardDiff.derivative(abs2, 3) == 6
@test fwd_derivative(abs2, 3) == 6
@test rev_derivative(abs2, 3) == 6

@test ForwardDiff.derivative(x -> fill(x,2,3), 7) == [1 1 1; 1 1 1]
@test fwd_derivative(x -> fill(x,2,3), 7) == [1 1 1; 1 1 1]
@test rev_derivative(x -> fill(x,2,3), 7) == [1 1 1; 1 1 1]

DERIVATIVES = (ForwardDiff.derivative, fwd_derivative, rev_derivative)

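# Gradient helpers: `fwd_gradient` takes one forward pass per input element, splicing a
# perturbed value into a copy of `x`; `rev_gradient` is a single reverse pass over the array.
# These are deliberately naive wrappers for testing, not efficient implementations.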
function fwd_gradient(f, x::AbstractVector)
    map(eachindex(x)) do i
        fwd_derivative(ξ -> f(vcat(x[begin:i-1], ξ, x[i+1:end])), x[i])
    end
end
fwd_gradient(f, x::AbstractArray) = reshape(fwd_gradient(v -> f(reshape(v, size(x))), vec(x)), size(x))
rev_gradient(f, x::AbstractArray) = ChainRulesCore.unthunk(Diffractor.PrimeDerivativeBack(f)(float(x)))

@test ForwardDiff.gradient(prod, [1,2,3]) == [6,3,2]
@test_broken fwd_gradient(prod, [1,2,3]) == [6,3,2]  # ERROR: MethodError: no method matching arrayset(::Bool, ::Vector{Int64}, ::Int64, ::Int64)
@test rev_gradient(prod, [1,2,3]) == [6,3,2]

@test fwd_gradient(sum, [1,2]) == [1,1]
@test_broken fwd_gradient(first, [1,1]) == [1,0]

GRADIENTS = (ForwardDiff.gradient, rev_gradient)

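# Jacobian helpers: `fwd_jacobian` hcat-s the vectorised per-input forward derivatives as
# columns; `rev_jacobian` builds one row per output element via a reverse pass.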
fwd_jacobian(f, x::AbstractArray) = hcat(vec.(fwd_gradient(f, x))...)
function rev_jacobian(f, x::AbstractArray)
    y = f(x)
    slices = map(LinearIndices(y)) do i  # fails if y isa Number, just like ForwardDiff.jacobian
        vec(rev_gradient(x -> f(x)[i], x))
    end
    vcat(transpose(slices)...)
    # permutedims(hcat(slices...))
end

@test ForwardDiff.jacobian(x -> x[1:2], [1,2,3]) == [1 0 0; 0 1 0]
@test_broken fwd_jacobian(x -> x[1:2], [1,2,3]) == [1 0 0; 0 1 0]
@test rev_jacobian(x -> x[1:2], [1,2,3]) == [1 0 0; 0 1 0]

JACOBIANS = (ForwardDiff.jacobian, rev_jacobian)

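# Hessian helpers, nesting the two modes in all four combinations: forward-over-forward,
# reverse-over-reverse, forward-over-reverse, and reverse-over-forward.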
fwd_hessian(f, x::AbstractArray) = fwd_jacobian(y -> fwd_gradient(f, y), x)
rev_hessian(f, x::AbstractArray) = rev_jacobian(y -> rev_gradient(f, y), x)
fwd_rev_hessian(f, x::AbstractArray) = fwd_jacobian(y -> rev_gradient(f, y), x)
rev_fwd_hessian(f, x::AbstractArray) = rev_jacobian(y -> fwd_gradient(f, y), x)

@test ForwardDiff.hessian(x -> -log(x[1]), [2,3]) == [0.25 0; 0 0]
@test rev_hessian(x -> -log(x[1]), [2,3]) == [0.25 0; 0 0]

HESSIANS = (ForwardDiff.hessian, rev_hessian)


# const XLEN = 13
# const YLEN = 7
# const X, Y = rand(XLEN), rand(YLEN)
# const CHUNK_SIZES = (1, div(DEFAULT_CHUNK_THRESHOLD, 3), div(DEFAULT_CHUNK_THRESHOLD, 2), DEFAULT_CHUNK_THRESHOLD, DEFAULT_CHUNK_THRESHOLD + 1)
# const HESSIAN_CHUNK_SIZES = (1, 2, 3)
# const FINITEDIFF_ERROR = 3e-5
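# Chunk sizes only make sense for ForwardDiff's Dual-number implementation, so of the
# constants above just the input sizes and the finite-difference tolerance are kept below.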
X, Y = rand(13), rand(7)
FINITEDIFF_ERROR = 3e-5


#####
##### ConfusionTest
#####


#####
##### DerivativeTest
#####

@testset verbose=true "DerivativeTest" begin

    x = 1

    @testset "scalar derivative of DiffTests.$f" for f in DiffTests.NUMBER_TO_NUMBER_FUNCS
        v = f(x)
        d = ForwardDiff.derivative(f, x)
        # @test isapprox(d, Calculus.derivative(f, x), atol=FINITEDIFF_ERROR)

        @test d ≈ fwd_derivative(f, x) broken=(f==DiffTests.num2num_4)
        @test d ≈ rev_derivative(f, x) broken=(f==DiffTests.num2num_4)
    end

    @testset "array derivative of DiffTests.$f" for f in DiffTests.NUMBER_TO_ARRAY_FUNCS
        v = f(x)
        d = ForwardDiff.derivative(f, x)
        # @test isapprox(d, Calculus.derivative(f, x), atol=FINITEDIFF_ERROR)

        @test d ≈ fwd_derivative(f, x)
        @test d ≈ rev_derivative(f, x)
    end

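    # d/dy x^y = x^y * log(x); at x = 0 the tested convention is -Inf for y <= 0 and 0.0 for
    # y > 0 (the limiting values), matching ForwardDiff's behaviour.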
    @testset "exponential function at base zero" for derivative in DERIVATIVES
        @test (x -> derivative(y -> x^y, -0.5))(0.0) === -Inf
        @test (x -> derivative(y -> x^y, 0.0))(0.0) === -Inf
        @test (x -> derivative(y -> x^y, 0.5))(0.0) === 0.0
        @test (x -> derivative(y -> x^y, 1.5))(0.0) === 0.0
    end

end

#####
##### GradientTest
#####

@testset verbose=true "GradientTest" begin

    @testset "hardcoded rosenbrock gradient" begin
        f = DiffTests.rosenbrock_1
        x = [0.1, 0.2, 0.3]
        v = f(x)
        g = [-9.4, 15.6, 52.0]

        @test g ≈ ForwardDiff.gradient(f, x)
        @test_broken g ≈ fwd_gradient(f, x)
        @test g ≈ rev_gradient(f, x)
    end

    @testset "gradient of DiffTests.$f" for f in DiffTests.VECTOR_TO_NUMBER_FUNCS
        v = f(X)
        g = ForwardDiff.gradient(f, X)
        # @test isapprox(g, Calculus.gradient(f, X), atol=FINITEDIFF_ERROR)

        @test g ≈ fwd_gradient(f, X)
        @test g ≈ rev_gradient(f, X)
    end

    @testset "exponential function at base zero: $gradient" for gradient in GRADIENTS
        @test isequal(gradient(t -> t[1]^t[2], [0.0, -0.5]), [NaN, NaN])
        @test isequal(gradient(t -> t[1]^t[2], [0.0, 0.0]), [NaN, NaN])
        @test isequal(gradient(t -> t[1]^t[2], [0.0, 0.5]), [Inf, NaN])
        @test isequal(gradient(t -> t[1]^t[2], [0.0, 1.5]), [0.0, 0.0])
    end

    @testset "chunk size zero - issue 399: $gradient" for gradient in GRADIENTS
        f_const(x) = 1.0
        g_grad_const = x -> gradient(f_const, x)
        @test g_grad_const([1.0]) == [0.0]
        @test isempty(g_grad_const(zeros(Float64, 0)))
    end

    @testset "ArithmeticStyle: $gradient" for gradient in GRADIENTS
        function f(p)
            sum(collect(0.0:p[1]:p[2]))
        end
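        # For p = [0.2, 25.0] the collected range has 126 elements, the k-th being k*p[1], so the
        # derivative with respect to the step is sum(0:125) = 7875; the endpoint only changes the
        # (discrete) length, hence a zero derivative in the second slot.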
        @test gradient(f, [0.2,25.0]) == [7875.0, 0.0]
    end

end

#####
##### HessianTest
#####

@testset verbose=true "HessianTest" begin

    @testset "hardcoded rosenbrock hessian" begin

        f = DiffTests.rosenbrock_1
        x = [0.1, 0.2, 0.3]
        v = f(x)
        g = [-9.4, 15.6, 52.0]
        h = [-66.0  -40.0    0.0;
             -40.0  130.0  -80.0;
               0.0  -80.0  200.0]

        @test isapprox(h, ForwardDiff.hessian(f, x))

        @test_skip h ≈ fwd_hessian(f, x)
        @test_broken h ≈ rev_hessian(f, x)  # control flow support not fully implemented yet for higher-order reverse mode
        @test_skip h ≈ rev_fwd_hessian(f, x)
        @test_skip h ≈ fwd_rev_hessian(f, x)
    end

    @testset "hessians for DiffTests.$f" for f in DiffTests.VECTOR_TO_NUMBER_FUNCS
        v = f(X)
        g = ForwardDiff.gradient(f, X)
        h = ForwardDiff.hessian(f, X)

        @test_broken g ≈ rev_gradient(f, X)
        @test_broken h ≈ rev_hessian(f, X)
    end

end

#####
##### JacobianTest
#####