
Add rule for prod #335

Merged (18 commits, May 27, 2021)
2 changes: 1 addition & 1 deletion Project.toml
@@ -1,6 +1,6 @@
name = "ChainRules"
uuid = "082447d4-558c-5d27-93f4-14fc19e9eca2"
version = "0.7.65"
version = "0.7.66"

[deps]
ChainRulesCore = "d360d2e6-b24c-11e9-a2a3-2a2ae2dbcce4"
81 changes: 81 additions & 0 deletions src/rulesets/Base/mapreduce.jl
@@ -55,3 +55,84 @@ function rrule(
end
return y, sum_abs2_pullback
end

#####
##### `prod`
#####

function rrule(::typeof(prod), x::AbstractArray{T}; dims=:) where {T<:CommutativeMulNumber}
Member
Apologies for diving in with my usual request, but is there a sensible way that we could restrict the type here, since the tests currently only look at Arrays? e.g. I imagine that at least one of Fill, Diagonal, StaticArray, etc. will do something weird here. Would StridedArray suffice for your use case?

Member Author (@mcabbott, Dec 28, 2020)

There is a test with PermutedDimsArray, which isn't a StridedArray, and I think it ought to work fine with StaticArrays, although I have not tested that in any depth. Diagonal seems to work although I struggle to imagine why calling prod on one would be a good idea, but weird things happen:

julia> unthunk(rrule(prod, Diagonal(SA[1,2,3,4]))[2](1.0)[2])
4×4 Diagonal{Float64, MVector{4, Float64}}:
 0.0   ⋅    ⋅    ⋅ 
  ⋅   0.0   ⋅    ⋅ 
  ⋅    ⋅   0.0   ⋅ 
  ⋅    ⋅    ⋅   0.0
  
julia> unthunk(rrule(prod, Fill(2,3))[2](1.0)[2])
3-element Vector{Float64}:
 4.0
 4.0
 4.0  

Fill makes a Vector gradient. Somehow rrule(sum, Fill(2,3)) makes a Fill, because it simply broadcasts rather than calling similar. Is this something the package aims to guarantee? I don't see a test for it. Elsewhere it chooses similar over broadcasting to avoid other issues.

Member

There is a test with PermutedDimsArray, which isn't a StridedArray

Apologies, it's late here. They are quite clearly in the tests...

Fill makes a Vector gradient

We would definitely want the output of rrule w.r.t. a Fill argument to be either another Fill or an appropriate Composite. This is the kind of thing that e.g. Zygote can probably get right without a rule in ChainRules, so I think the ideal solution here is just not to implement a rule that covers Fill.

Also, should the result with Diagonal have zeros on the diagonal?

Member Author (@mcabbott, Dec 28, 2020)

Also, should the result with Diagonal have zeros on the diagonal?

Something is broken on the last commit, but not this, this one you can do in your head: It's a product of mostly zeros, so the gradient with respect to nonzero entries still vanishes.
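
(A quick check of that claim, as a sketch using ForwardDiff, which is not a dependency of this PR:)

```julia
using ForwardDiff

# With two (or more) zeros present, every partial derivative is itself
# a product containing at least one zero, so the whole gradient vanishes:
ForwardDiff.gradient(prod, [2.0, 0.0, 0.0, 5.0])  # -> [0.0, 0.0, 0.0, 0.0]
```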

Fill makes a Vector gradient

We would definitely want

This could be arranged at the cost of more complexity... although possibly Fill ought to define similar more like that of Diagonal if it wishes to be preserved under such things?

Although clearly not all gradients are going to preserve this structure:

julia> gradient(sum∘cumsum, Fill(1,3))[1]
3-element Vector{Int64}:
 3
 2
 1
 
julia> gradient(x -> sum(cumsum(x, dims=1)), Diagonal([1,2,3]))[1]  # what should this produce?

And here's how much Zygote can figure out right now:

julia> function myprod(xs)
           out = 1.0
           for x in xs
               out *= x
           end
           out
       end
myprod (generic function with 1 method)

julia> gradient(myprod, Fill(1,3))[1]
3-element Vector{Float64}:
 1.0
 1.0
 1.0

Member

Something is broken on the last commit, but not this, this one you can do in your head: It's a product of mostly zeros, so the gradient with respect to nonzero entries still vanishes.

Yes, good point.

julia> gradient(sum∘cumsum, Fill(1,3))[1]

This should produce a Composite with an appropriate value field.

julia> gradient(x -> sum(cumsum(x, dims=1)), Diagonal([1,2,3]))[1] # what should this produce?

This should also produce either a Diagonal or an appropriate Composite.

But with all of these types, I'm not saying that your PR needs to cover them. I'm purely suggesting it addresses the minimal set of types that you're confident are done correctly, and assumes that AD can do a reasonable job of deriving the others.

julia> gradient(myprod, Fill(1,3))[1]

The answer to this is the result of a bug in Zygote that I should fix -- it looks like an example of what I'm commenting on here, where getindex has been implemented for too broad a set of types. Zygote really should be able to derive the rule for this properly. i.e. getindex only ever returns the value field of a Fill, so you shouldn't even need a rule for getindex for Fill.

Member

So we can get this merged, shall we change this to StridedArray and then we can make a follow up later?

    y = prod(x; dims=dims)
    # vald = dims isa Colon ? nothing : dims isa Integer ? Val(Int(dims)) : Val(Tuple(dims))
    function prod_pullback(dy)
        x_thunk = InplaceableThunk(
            # Out-of-place version
            @thunk if dims === (:)
                ∇prod(x, dy, y)
            elseif any(iszero, x)  # Then, and only then, will ./x lead to NaN
                vald = dims isa Colon ? nothing : dims isa Integer ? Val(Int(dims)) : Val(Tuple(dims))
                ∇prod_dims(vald, x, dy, y)  # Val(Int(dims)) is about 2x faster than Val(Tuple(dims))
            else
                conj.(y ./ x) .* dy
            end
            ,
            # In-place version -- same branching
            dx -> if dims === (:)
                ∇prod!(dx, x, dy, y)
            elseif any(iszero, x)
                vald = dims isa Colon ? nothing : dims isa Integer ? Val(Int(dims)) : Val(Tuple(dims))
                ∇prod_dims!(dx, vald, x, dy, y)
            else
                dx .+= conj.(y ./ x) .* dy
            end
        )
        return (NO_FIELDS, x_thunk)
    end
    return y, prod_pullback
end
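
As a sanity check of the rule above: in the zero-free case the pullback reduces to the familiar closed form prod(x) ./ x scaled by the cotangent (a sketch, assuming this PR's rule is loaded via ChainRules):

```julia
using ChainRules: rrule, unthunk

x = [2.0, 3.0, 4.0]
y, pb = rrule(prod, x)   # y == 24.0
dself, dx = pb(1.0)      # pullback with cotangent 1.0
unthunk(dx)              # == y ./ x == [12.0, 8.0, 6.0]
```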

function ∇prod_dims(vald::Val{dims}, x, dy, y=prod(x; dims=dims)) where {dims}
    T = promote_type(eltype(x), eltype(dy))
    dx = fill!(similar(x, T, axes(x)), zero(T))
    ∇prod_dims!(dx, vald, x, dy, y)
    return dx
end

function ∇prod_dims!(dx, ::Val{dims}, x, dy, y) where {dims}
    iters = ntuple(d -> d in dims ? tuple(:) : axes(x,d), ndims(x))  # Without Val(dims) this is a serious type instability
    @inbounds for ind in Iterators.product(iters...)
        jay = map(i -> i isa Colon ? 1 : i, ind)
        @views ∇prod!(dx[ind...], x[ind...], dy[jay...], y[jay...])
    end
    return dx
end
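
To illustrate the iteration above: for a 2×3 matrix with dims = (1,), iters pins a Colon in the reduced dimension, so Iterators.product visits one column slice per step, while jay selects the matching 1×1 slice of dy and y (a standalone sketch, not part of the diff):

```julia
x = ones(2, 3)
dims = (1,)
iters = ntuple(d -> d in dims ? tuple(:) : axes(x, d), ndims(x))
# iters == ((Colon(),), Base.OneTo(3))
for ind in Iterators.product(iters...)        # ind is (:, 1), (:, 2), (:, 3)
    jay = map(i -> i isa Colon ? 1 : i, ind)  # jay is (1, 1), (1, 2), (1, 3)
end
```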

function ∇prod(x, dy::Number=1, y::Number=prod(x))
    T = promote_type(eltype(x), eltype(dy))
    dx = fill!(similar(x, T, axes(x)), zero(T))  # axes(x) makes MArray on StaticArrays, Array for structured matrices
    ∇prod!(dx, x, dy, y)
    return dx
end

function ∇prod!(dx, x, dy::Number=1, y::Number=prod(x))
    numzero = iszero(y) ? count(iszero, x) : 0
    if numzero == 0  # y == 0 can still occur here, if several small xs underflow
        dx .+= conj.(y ./ x) .* dy
    elseif numzero == 1
        ∇prod_one_zero!(dx, x, dy)
    else
        # numzero > 1, so all first derivatives are zero
    end
    return dx
end
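
The comment on the numzero == 0 branch covers an underflow corner: prod can return exactly zero even when no entry of x is zero, in which case y ./ x is zero rather than NaN, so that branch still behaves sensibly (a sketch, mirroring the Float32 test below):

```julia
v = [1f-5, 1f-10, 1f-15, 1f-20]
y = prod(v)                # underflows to 0.0f0, yet count(iszero, v) == 0
dx = conj.(y ./ v) .* 1f0  # no NaN: 0 ./ v is just zeros
# dx == zeros(Float32, 4); the true partials mostly underflow as well
```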

function ∇prod_one_zero!(dx, x, dy::Number=1)  # assumes exactly one entry of x is zero
    i_zero = 0
    p_rest = one(promote_type(eltype(x), typeof(dy)))
    for i in eachindex(x)
        xi = @inbounds x[i]
        p_rest *= ifelse(iszero(xi), one(xi), conj(xi))
        i_zero = ifelse(iszero(xi), i, i_zero)
    end
    dx[i_zero] += p_rest * dy
    return
end
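
A hand-checkable example of the numzero == 1 path: only the zero entry gets a nonzero partial, equal to the product of all the remaining entries (a sketch, assuming the helpers above are in scope):

```julia
x = [2.0, 0.0, 3.0]  # exactly one zero
dx = zeros(3)
∇prod!(dx, x)        # dispatches to ∇prod_one_zero!
# dx == [0.0, 6.0, 0.0]: ∂prod/∂x[2] == 2.0 * 3.0; the other partials vanish
```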
56 changes: 56 additions & 0 deletions test/rulesets/Base/mapreduce.jl
@@ -20,4 +20,60 @@
end
end
end # sum abs2

@testset "prod" begin
    @testset "Array{$T}" for T in [Float64, ComplexF64]
        @testset "size = $sz, dims = $dims" for (sz, dims) in [
            ((12,), :), ((12,), 1),
            ((3,4), 1), ((3,4), 2), ((3,4), :), ((3,4), [1,2]),
            ((3,4,1), 1), ((3,2,2), 3), ((3,2,2), 2:3),
        ]
            x = randn(T, sz)
            test_rrule(prod, x; fkwargs=(dims=dims,), check_inferred=true)
            x[1] = 0
            test_rrule(prod, x; fkwargs=(dims=dims,), check_inferred=true)
            x[5] = 0
            test_rrule(prod, x; fkwargs=(dims=dims,), check_inferred=true)
            x[3] = x[7] = 0  # two zeros along some slice, for any dims
            test_rrule(prod, x; fkwargs=(dims=dims,), check_inferred=true)

            if ndims(x) == 3
                xp = PermutedDimsArray(x, (3,2,1))  # not a StridedArray
                xpdot, xpbar = permutedims(rand(T, sz), (3,2,1)), permutedims(rand(T, sz), (3,2,1))
                test_rrule(prod, xp ⊢ xpbar; fkwargs=(dims=dims,), check_inferred=true)
            end
        end

        @testset "structured wrappers" begin
            # Adjoint -- like PermutedDimsArray this may actually be used
            xa = adjoint(rand(T,4,4))
            test_rrule(prod, xa ⊢ rand(T,4,4))
            test_rrule(prod, xa ⊢ rand(T,4,4), fkwargs=(dims=2,))
            @test unthunk(rrule(prod, adjoint(rand(T,3,3)))[2](1.0)[2]) isa Matrix
            @test unthunk(rrule(prod, adjoint(rand(T,3,3)), dims=1)[2](ones(1,3))[2]) isa Matrix

            # Diagonal -- a stupid thing to do, product of zeros! Shouldn't be an error though:
            @test iszero(unthunk(rrule(prod, Diagonal(rand(T,3)))[2](1.0)[2]))
            @test iszero(unthunk(rrule(prod, Diagonal(rand(T,3)), dims=1)[2](ones(1,3))[2]))
            @test unthunk(rrule(prod, Diagonal(rand(T,1)))[2](1.0)[2]) == hcat(1)  # 1x1 sparse matrix
            @test unthunk(rrule(prod, Diagonal(ones(T,2)), dims=1)[2](ones(1,2))[2]) == [0 1; 1 0]

            # Triangular -- almost equally stupid
            @test iszero(unthunk(rrule(prod, UpperTriangular(rand(T,3,3)))[2](1.0)[2]))
            @test unthunk(rrule(prod, UpperTriangular(ones(T,2,2)))[2](1.0)[2]) == [0 0; 1 0]

            # Symmetric -- at least this doesn't have zeros, still an unlikely combination
            xs = Symmetric(rand(T,4,4))
            @test_skip test_rrule(prod, xs ⊢ rand(T,4,4))
            @test_skip test_rrule(prod, xs ⊢ rand(T,4,4), fkwargs=(dims=2,))
Comment on lines +67 to +68
Member Author

Is there a bug in how FiniteDifferences does this, or am I thinking incorrectly about what it should produce?

using ForwardDiff, FiniteDifferences
xs = Symmetric(reshape(1:16,4,4)./10)
xm = Matrix(xs)

g1 = ForwardDiff.gradient(prod, xm) # symmetric, but not Symmetric
g2 = grad(central_fdm(5, 1), prod, xm)[1]
g3 = grad(central_fdm(5, 1), prod, xs)[1]  # is Symmetric, and differs

g1 ≈ g2
diag(g1) ≈ diag(g3)
UnitUpperTriangular(g1) ≈ UnitUpperTriangular(g3 ./ 2)  # this seems weird

With dims:

g4 = ForwardDiff.gradient(x -> sum(prod(x,dims=1)), xm) # no longer symmetric
g5 = grad(central_fdm(5, 1), x -> sum(prod(x,dims=1)), xm)[1] 
g6 = grad(central_fdm(5, 1), x -> sum(prod(x,dims=1)), xs)[1] 

g4 ≈ g5

proj(m) = (m .+ m')./2;
proj(g4) ≈ proj(proj(g4)) # it's a projection

fold(m) = m .+ m' .- Diagonal(m)
fold(g4) ≈ g6
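
The off-diagonal factor of two can be reproduced without any AD package: nudging one stored entry of a Symmetric moves both A[i,j] and A[j,i], so differencing through the wrapper doubles the off-diagonal sensitivity (a sketch using only LinearAlgebra):

```julia
using LinearAlgebra

h = 1e-6
f(t) = prod(Symmetric([0.1 0.2+t; 0.0 0.4]))  # perturbs the stored upper entry
g(t) = prod([0.1 0.2+t; 0.2 0.4])             # perturbs only one entry of a plain Matrix

(f(h) - f(0)) / (g(h) - g(0))  # ≈ 2: the wrapper doubles the off-diagonal sensitivity
```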


Member

I suggest checking what FiniteDifferences.to_vec is outputting.

Member Author

For now I've left here a simpler test that it does run without error on a Symmetric: unthunk(rrule(prod, Symmetric(ones(T,2,2)))[2](1.0)[2]) == [1 1; 1 1]. I very much doubt this case is going to see use, but it shouldn't give an error.

Member

Would it be better to have a test with Symmetric([2.0 3.0; 3.0 2.0])? Ones are hard to trust.

Member Author

OK, I've switched it. It's mostly to check this doesn't give an error, the computation here does not care at all what kind of matrix it gets. Although ones is in fact sufficient to see this weirdness:

julia> grad(central_fdm(5, 1), prod, Symmetric(ones(2,2)))[1]
2×2 Symmetric{Float64, Matrix{Float64}}:
 1.0  2.0
 2.0  1.0

julia> ForwardDiff.gradient(prod, ones(2,2))
2×2 Matrix{Float64}:
 1.0  1.0
 1.0  1.0

            @test unthunk(rrule(prod, Symmetric(T[1 2; -333 4]))[2](1.0)[2]) == [16 8; 8 4]
        end
    end
    @testset "Array{Float32}, no zero entries" begin
        v = [1f-5, 1f-10, 1f-15, 1f-20]
        @test prod(v) == 0
        @test unthunk(rrule(prod, v)[2](1f0)[2]) == zeros(4)
        test_rrule(prod, v)
    end
end  # prod
end