Gradient prototype implementation, Val{:central} with Val{:Real} should work.

dextorious · ChrisRackauckas · commit 09101c79193f · 2018-02-15T06:44:32.000-08:00
diff --git a/src/derivatives.jl b/src/derivatives.jl
@@ -82,38 +82,38 @@ function DerivativeCache(
         Val{:Complex} : Val{:Real}
     )
 
-    if typeof(x)<:StridedArray && typeof(fx)<:Union{Void,StridedArray}
-        if typeof(epsilon)!=Void
-            warn("StridedArrays don't benefit from pre-allocating epsilon.")
-            epsilon = nothing
-        end
+    if fdtype == Val{:complex} && RealOrComplex == Val{:Complex}
+        fdtype_error(Val{:Complex})
     end
-    if fdtype == Val{:complex}
-        if RealOrComplex == Val{:Complex}
-            fdtype_error(Val{:Complex})
-        end
-        if typeof(fx) != Void || typeof(epsilon) != Void
-            warn("Val{:complex} doesn't benefit from cache arrays.")
-        end
-        return DerivativeCache{Void,Void,fdtype,RealOrComplex}(nothing, nothing)
+
+    if fdtype != Val{:forward}
+        warn("Pre-computed function values are only useful for fdtype == Val{:forward}.")
+        _fx = nothing
+    else
+        # more runtime sanity checks?
+        _fx = fx
+    end
+
+    if typeof(epsilon) == Void
+        _epsilon = nothing
     else
-        if !(typeof(x)<:StridedArray && typeof(fx)<:Union{Void,StridedArray})
+        if typeof(x)<:StridedArray && typeof(fx)<:Union{Void,StridedArray}
+            warn("StridedArrays don't benefit from pre-allocating epsilon.")
+            _epsilon = nothing
+        elseif fdtype == Val{:complex}
+            warn("Val{:complex} makes the epsilon array redundant.")
+            _epsilon = nothing
+        else
             epsilon_elemtype = compute_epsilon_elemtype(epsilon, x)
             if typeof(epsilon) == Void || eltype(epsilon) != epsilon_elemtype
                 epsilon = zeros(epsilon_elemtype, size(x))
             end
             epsilon_factor = compute_epsilon_factor(fdtype, real(eltype(x)))
             @. epsilon = compute_epsilon(fdtype, real(x), epsilon_factor)
-        end
-        if fdtype != Val{:forward}
-            if typeof(fx) != Void
-                warn("Pre-computed function values are only useful for fdtype == Val{:forward}.")
-            end
-            return DerivativeCache{Void,typeof(epsilon),fdtype,RealOrComplex}(nothing,epsilon)
-        else
-            return DerivativeCache{typeof(fx),typeof(epsilon),fdtype,RealOrComplex}(fx,epsilon)
+            _epsilon = epsilon
         end
     end
+    DerivativeCache{typeof(_fx),typeof(_epsilon),fdtype,RealOrComplex}(_fx,_epsilon)
 end
 
 #=
diff --git a/src/gradients.jl b/src/gradients.jl
@@ -1,36 +1,167 @@
-struct GradientCache{CacheType,CacheType2,CacheType3,fdtype,RealOrComplex}
-    x1::CacheType
-    fx::CacheType2
-    fx1::CacheType3
-end
-
-function GradientCache(x1,fx,_fx1,fdtype::DataType=Val{:central},
-                       RealOrComplex::DataType =
-                       fdtype==Val{:complex} ? Val{:Real} : eltype(x1) <: Complex ?
-                       Val{:Complex} : Val{:Real})
-    if fdtype == Val{:complex} && _fx1 != nothing
-        warn("fx1 cache is ignored when fdtype == Val{:complex}.")
-        fx1 = nothing
+struct GradientCache{CacheType, CacheType2, CacheType3, fdtype, RealOrComplex}
+    fx :: CacheType1
+    c1 :: CacheType2
+    c2 :: CacheType3
+end
+
+function GradientCache(
+    df     :: AbstractArray{<:Number},
+    x      :: Union{<:Number, AbstractArray{<:Number}},
+    fx     :: Union{Void,AbstractArray{<:Number}} = nothing,
+    c1     :: AbstractArray{<:Number} = nothing,
+    c2     :: AbstractArray{<:Number} = nothing,
+    fdtype :: DataType = Val{:central},
+    RealOrComplex :: DataType =
+        fdtype==Val{:complex} ? Val{:Real} : eltype(x1) <: Complex ? Val{:Complex} : Val{:Real}
+    )
+
+    if fdtype == Val{:complex} && RealOrComplex == Val{:Complex}
+        fdtype_error(Val{:Complex})
+    end
+
+    if fdtype != Val{:forward}
+        warn("Pre-computed function values are only useful for fdtype == Val{:forward}.")
+        _fx = nothing
+    else
+        # more runtime sanity checks?
+        _fx = fx
+    end
+
+    if typeof(x) <: AbstractArray # the f:R^n->R case
+        # need cache arrays for epsilon and x1
+        epsilon_elemtype = compute_epsilon_elemtype(epsilon, x)
+        if typeof(c1) == Void || eltype(c1) != epsilon_elemtype
+            _c1 = zeros(epsilon_elemtype, size(x))
+        else
+            _c1 = c1
+        end
+        epsilon_factor = compute_epsilon_factor(fdtype, real(eltype(x)))
+        @. _c1 = compute_epsilon(fdtype, real(x), epsilon_factor)
+
+        if typeof(c2) != typeof(x) || size(c2) != size(x)
+            _c2 = copy(x)
+        else
+            copy!(_c2, x)
+        end
+    else # the f:R->R^n case
+        # need cache arrays for fx1 and fx2
+        if typeof(c1) != typeof(df) || size(c1) != size(df)
+            _c1 = similar(df)
+        else
+            _c1 = c1
+        end
+        if typeof(c2) != typeof(df) || size(c2) != size(df)
+            _c2 = similar(df)
+        else
+            _c2 = c2
+        end
+    end
+    GradientCache{typeof(fx),typeof(c1),typeof(c2),fdtype,RealOrComplex}(fx,c1,c2)
+end
+
+function finite_difference_gradient(f, x, fdtype::DataType=Val{:central},
+    RealOrComplex::DataType =
+        fdtype==Val{:complex} ? Val{:Real} : eltype(x) <: Complex ? Val{:Complex} : Val{:Real},
+    fx::Union{Void,AbstractArray{<:Number}}=nothing,
+    c1::Union{Void,AbstractArray{<:Number}}=nothing,
+    c2::Union{Void,AbstractArray{<:Number}}=nothing,
+    )
+
+    if typeof(x) <: AbstractArray
+        df = similar(x)
     else
-        fx1 = _fx1
+        df = similar(f(x))  # can we get rid of this by requesting more information?
     end
-    GradientCache{typeof(x1),typeof(fx),typeof(fx1),
-                  fdtype,RealOrComplex}(x1,fx,fx1)
+    cache = GradientCache(df,x,fx,c1,c2,fdtype,RealOrComplex)
+    finite_difference_gradient!(df,f,x,cache)
 end
 
-function finite_difference_gradient(f,x,fdtype=Val{:central},
-                    RealOrComplex::DataType =
-                    fdtype==Val{:complex} ? Val{:Real} : eltype(x) <: Complex ?
-                    Val{:Complex} : Val{:Real})
-    x1 = similar(x)
-    fx = similar(x)
-    fx1 = similar(x)
-    cache = GradientCache(x1,fx,fx1,fdtype,RealOrComplex)
-    finite_difference_gradient(f,x,cache)
+function finite_difference_gradient!(df, f, x, fdtype::DataType=Val{:central},
+    RealOrComplex::DataType =
+        fdtype==Val{:complex} ? Val{:Real} : eltype(x) <: Complex ? Val{:Complex} : Val{:Real},
+    fx::Union{Void,AbstractArray{<:Number}}=nothing,
+    c1::Union{Void,AbstractArray{<:Number}}=nothing,
+    c2::Union{Void,AbstractArray{<:Number}}=nothing,
+    )
+
+    cache = GradientCache(df,x,fx,c1,c2,fdtype,RealOrComplex)
+    finite_difference_gradient!(df,f,x,cache)
 end
 
 function finite_difference_gradient(f,x,cache::GradientCache)
-    G = zeros(eltype(x), length(x), length(x))
-    finite_difference_gradient!(J,f,x,cache)
-    J
+    if typeof(x) <: AbstractArray
+        df = similar(x)
+    else
+        df = similar(cache.c1)
+    end
+    finite_difference_gradient!(df,f,x,cache)
+    df
+end
+
+# vector of derivatives of f : R^n -> R by each component of a vector x
+function finite_difference_gradient!(df::AbstractArray{<:Number}, f, x::AbstractArray{<:Number},
+    cache::GradientCache{T1,T2,T3,fdtype,Val{:Real}}) where {T1,T2,T3,fdtype}
+
+    # NOTE: in this case epsilon is a vector, we need two arrays for epsilon and x1
+    # c1 denotes epsilon (pre-computed by the cache constructor),
+    # c2 is x1, pre-set to the values of x by the cache constructor
+    fx, c1, c2 = cache.fx, cache.c1, cache.c2
+    if fdtype == Val{:forward}
+        # TODO: do we even need c2 for the forward case?
+        @inbounds for i ∈ eachindex(x)
+            c2[i] += c1[i]
+            df[i]  = (f(c2) - f(x)) / c1[i]
+            c2[i] -= c1[i]
+        end
+    elseif fdtype == Val{:central}
+        @inbounds for i ∈ eachindex(x)
+            #copy!(x1,x)
+            c2[i] += c1[i]
+            x[i]  -= c1[i]
+            df[i]  = (f(c2) - f(x)) / (2*c1[i])
+            c2[i] -= c1[i]
+            x[i]  += c1[i] # revert any changes to x
+        end
+    elseif fdtype == Val{:complex}
+        # TODO
+    end
+    df
+end
+
+# vector of derivatives of f : R -> R^n
+# this is effectively a vector of partial derivatives, but we still call it a gradient
+function finite_difference_gradient!(df::AbstractArray{<:Number}, f, x::Number,
+    cache::GradientCache{T1,T2,T3,fdtype,Val{:Real}}) where {T1,T2,T3,fdtype}
+
+    # NOTE: in this case epsilon is a scalar, we need two arrays for fx1 and fx2
+    # c1 denotes fx1, c2 is fx2, sizes guaranteed by the cache constructor
+    fx, c1, c2 = cache.fx, cache.c1, cache.c2
+
+    if fdtype == Val{:forward}
+        # TODO
+    elseif fdtype == Val{:central}
+        c1 .= f(x+epsilon)
+        c2 .= f(x-epsilon)
+        @inbounds for i ∈ 1 : length(fx)
+            df[i] = (f(x+epsilon)[1] - f(x-epsilon)[1]) / (2*epsilon)
+        end
+    elseif fdtype == Val{:complex}
+        # TODO
+    end
+    df
+end
+
+
+function finite_difference_gradient!(df::AbstractArray{<:Number}, f, x::AbstractArray{<:Number},
+    cache::GradientCache{T1,T2,T3,fdtype,Val{:Complex}}) where {T1,T2,T3,fdtype}
+
+    # TODO
+    df
+end
+
+function finite_difference_gradient!(df::AbstractArray{<:Number}, f, x::Number,
+    cache::GradientCache{T1,T2,T3,fdtype,Val{:Complex}}) where {T1,T2,T3,fdtype}
+
+    # TODO
+    df
 end