2
2
# forward #
3
3
# ##########
4
4
5
- function dualwrap {N,T,A} (duals:: AbstractArray{Dual{N,T}} , :: Type{A} , tp:: Nullable{Tape} )
5
+ function retrack_duals {N,T,A} (duals:: AbstractArray{Dual{N,T}} , :: Type{A} , tp:: Nullable{Tape} )
6
6
ts = similar (duals, Tracked{T,A})
7
7
for i in eachindex (duals)
8
8
ts[i] = Tracked (value (duals[i]), A, tp)
@@ -19,7 +19,7 @@ for A in ARRAY_TYPES
19
19
fdual = t -> fopt. f (Dual (value (t), one (V)))
20
20
duals = $ (g)(fdual, x)
21
21
tp = tape (x)
22
- out = dualwrap (duals, S, tp)
22
+ out = retrack_duals (duals, S, tp)
23
23
record! (tp, $ (g), x, out, duals)
24
24
return out
25
25
end
@@ -31,10 +31,32 @@ for A in ARRAY_TYPES
31
31
Dual (value (t2), zero (V2), one (V2)))
32
32
duals = $ (g)(fdual, x1, x2)
33
33
tp = tape (x1, x2)
34
- out = dualwrap (duals, S, tp)
34
+ out = retrack_duals (duals, S, tp)
35
35
record! (tp, $ (g), (x1, x2), out, duals)
36
36
return out
37
37
end
38
+
39
# Elementwise `$(g)` (map-like) where only the FIRST array argument is tracked.
# `g` and `A` are interpolated by the enclosing `@eval for A in ARRAY_TYPES` loop.
# Each tracked entry of `x1` is seeded with a one-epsilon Dual, so `partials(d, 1)`
# of every result dual is the derivative w.r.t. the corresponding `x1` element;
# `x2` carries no tracked values and is passed through as-is.
function Base.$(g){F,V,S}(fopt::ForwardOptimize{F},
                          x1::$(A){Tracked{V,S}},
                          x2::$(A))
    fdual = (t1, t2) -> fopt.f(Dual(value(t1), one(V)), t2)
    duals = $(g)(fdual, x1, x2)
    # Only x1 participates in the tape lookup — x2 is untracked.
    tp = tape(x1)
    out = retrack_duals(duals, S, tp)
    # Record only the tracked input; the reverse pass reads partials index 1 for it.
    record!(tp, $(g), x1, out, duals)
    return out
end
49
+
50
# Elementwise `$(g)` (map-like) where only the SECOND array argument is tracked.
# Mirror image of the (tracked, untracked) method: `x2`'s entries get the
# one-epsilon Dual seed, so `partials(d, 1)` is the derivative w.r.t. `x2`.
function Base.$(g){F,V,S}(fopt::ForwardOptimize{F},
                          x1::$(A),
                          x2::$(A){Tracked{V,S}})
    fdual = (t1, t2) -> fopt.f(t1, Dual(value(t2), one(V)))
    duals = $(g)(fdual, x1, x2)
    # Only x2 participates in the tape lookup — x1 is untracked.
    tp = tape(x2)
    out = retrack_duals(duals, S, tp)
    record!(tp, $(g), x2, out, duals)
    return out
end
38
60
end
39
61
end
40
62
@@ -58,7 +80,7 @@ for A in ARRAY_TYPES
58
80
fdual = t -> fopt. f (ndual, Dual (value (t), zero (X), one (X)))
59
81
duals = broadcast (fdual, x)
60
82
tp = tape (n, x)
61
- out = dualwrap (duals, S, tp)
83
+ out = retrack_duals (duals, S, tp)
62
84
record! (tp, broadcast, (n, x), out, duals)
63
85
return out
64
86
end
@@ -68,10 +90,30 @@ for A in ARRAY_TYPES
68
90
fdual = t -> fopt. f (Dual (value (t), one (X), zero (X)), ndual)
69
91
duals = broadcast (fdual, x)
70
92
tp = tape (n, x)
71
- out = dualwrap (duals, S, tp)
93
+ out = retrack_duals (duals, S, tp)
72
94
record! (tp, broadcast, (x, n), out, duals)
73
95
return out
74
96
end
97
+
98
# broadcast of a tracked scalar `n` against an UNTRACKED array `x`.
# `n` is seeded with a one-epsilon Dual, so partials index 1 of every result
# dual is d(out)/d(n); `x`'s elements contribute no derivative information.
function Base.broadcast{F,V,S}(fopt::ForwardOptimize{F}, n::Tracked{V,S}, x::$(A))
    ndual = Dual(value(n), one(V))
    fdual = t -> fopt.f(ndual, t)
    duals = broadcast(fdual, x)
    # Only the scalar is tracked, so the tape comes from `n` alone.
    tp = tape(n)
    out = retrack_duals(duals, S, tp)
    record!(tp, broadcast, n, out, duals)
    return out
end
107
+
108
# broadcast of an UNTRACKED array `x` against a tracked scalar `n`
# (argument order swapped relative to the method above). The seeding is the
# same: `n` carries the single epsilon, so partials index 1 is d(out)/d(n).
function Base.broadcast{F,V,S}(fopt::ForwardOptimize{F}, x::$(A), n::Tracked{V,S})
    ndual = Dual(value(n), one(V))
    fdual = t -> fopt.f(t, ndual)
    duals = broadcast(fdual, x)
    tp = tape(n)
    out = retrack_duals(duals, S, tp)
    # Only `n` is recorded as the input — `x` needs no adjoint accumulation.
    record!(tp, broadcast, n, out, duals)
    return out
end
75
117
end
76
118
77
119
# standard elementwise operations (.+, .-, .*, etc.) #
@@ -82,13 +124,29 @@ for A in ARRAY_TYPES
82
124
return broadcast (ForwardOptimize ($ (f)), x, y)
83
125
end
84
126
127
# Mixed tracked/untracked array-array elementwise operators (`.+`, `.*`, ...):
# one operand holds Tracked elements, the other is a plain array. Both simply
# forward to the generic broadcast machinery via ForwardOptimize.
@inline function Base.$(f){X<:Tracked}(x::$(A){X}, y::$(A))
    return broadcast(ForwardOptimize($(f)), x, y)
end

@inline function Base.$(f){Y<:Tracked}(x::$(A), y::$(A){Y})
    return broadcast(ForwardOptimize($(f)), x, y)
end
134
+
85
135
# Tracked scalar combined with a tracked-element array: dispatch to the
# broadcast implementation, which seeds duals for both operands.
@inline function Base.$(f){T<:Tracked}(n::Tracked, x::$(A){T})
    return broadcast(ForwardOptimize($(f)), n, x)
end

@inline function Base.$(f){T<:Tracked}(x::$(A){T}, n::Tracked)
    return broadcast(ForwardOptimize($(f)), x, n)
end
142
+
143
# Tracked scalar combined with an UNTRACKED array: dispatch to the
# scalar-tracking broadcast methods, which record only `n` on the tape.
@inline function Base.$(f)(n::Tracked, x::$(A))
    return broadcast(ForwardOptimize($(f)), n, x)
end

@inline function Base.$(f)(x::$(A), n::Tracked)
    return broadcast(ForwardOptimize($(f)), x, n)
end
92
150
end
93
151
for R in REAL_TYPES
94
152
@eval begin
@@ -138,26 +196,34 @@ function special_reverse_step!{A,B}(::typeof(broadcast), inputs::Tuple{A,B}, out
138
196
if size (a) == size (b)
139
197
special_reverse_step! (map, inputs, output, duals)
140
198
else
141
- for i in eachindex (duals)
142
- duals[i] *= adjoint (output[i])
143
- end
144
- s = sumover (1 , a, duals)
145
- increment_adjoint! (a, s)
146
- increment_adjoint! (b, sumover (2 , b, duals))
199
+ broadcast_adjoint_reduce! (a, output, duals, 1 )
200
+ broadcast_adjoint_reduce! (b, output, duals, 2 )
147
201
end
148
202
return nothing
149
203
end
150
204
151
- # Inference here is pretty wonky (see JuliaLang/julia#10533),
152
- # so it's important that we allocate the array for the sum
153
- # result ourselves. Otherwise, `reducedim_init` tries to
154
- # allocate an array of the wrong type in some cases, which
155
- # leads to conversion errors.
156
- function sumover {N,M,T} (p, x:: AbstractArray , duals:: AbstractArray{Dual{N,T},M} )
157
- dims = (size (x, i) != size (duals, i) ? 1 : size (duals, i) for i in 1 : ndims (duals))
158
- result = similar (duals, T, (dims... ):: NTuple{M,Int} )
159
- sum! (d -> partials (d, p), result, duals)
160
- return result
205
# Reverse pass for a recorded broadcast whose single recorded input is a scalar.
# Partials index 1 matches the one-epsilon seeding used by the scalar-tracking
# broadcast methods at record time.
function special_reverse_step!(::typeof(broadcast), input::Number, output, duals)
    broadcast_adjoint_reduce!(input, output, duals, 1)
    return nothing
end
209
+
210
# This strategy should be pretty fast, but it might be prone to numerical error if the
# accumulated adjoint becomes too large compared to the individual terms being added to
# it. This can be overcome by using the divide-and-conquer strategy used by
# Base.mapreducedim, but that strategy is less cache efficient and more complicated to
# implement.
#
# Accumulate `adjoint(output[i]) * partials(duals[i], p)` into `input`'s adjoint,
# reducing over any dimensions along which `input` was broadcast to produce `output`.
function broadcast_adjoint_reduce!{T,N}(input::AbstractArray, output::AbstractArray{T,N}, duals, p)
    # For dimensions where `input`'s extent differs from `duals`' (i.e. `input`
    # was broadcast along a singleton dimension), clamp the index to 1 so every
    # output element maps back to the source element that produced it.
    dims = (size(input, i) != size(duals, i) ? 1 : size(duals, i) for i in 1:ndims(duals))
    max_input_index = CartesianIndex((dims...)::NTuple{N,Int})
    # Iterate over the FULL broadcast extent (`duals`/`output`), not `size(input)`:
    # this helper is called precisely when shapes differ, and sweeping only
    # `input`'s extent would skip the broadcast-produced elements, dropping their
    # contributions to `input`'s adjoint.
    for i in CartesianRange(size(duals))
        increment_adjoint!(input[min(max_input_index, i)], adjoint(output[i]) * partials(duals[i], p))
    end
    return nothing
end
162
223
163
- sumover (p, x:: Real , duals) = sum (d -> partials (d, p), duals)
224
# Scalar-input counterpart: a broadcast scalar contributes to every output
# element, so every element of `duals` folds into the single adjoint of `input`.
function broadcast_adjoint_reduce!{T,N}(input::Number, output::AbstractArray{T,N}, duals, p)
    for i in eachindex(duals)
        increment_adjoint!(input, adjoint(output[i]) * partials(duals[i], p))
    end
    return nothing
end
0 commit comments