probcomp · bzinberg · Aug 2, 2021 · Jul 14, 2021 · Jul 14, 2021 · Jul 14, 2021
diff --git a/src/modeling_library/distributions/normal.jl b/src/modeling_library/distributions/normal.jl
@@ -65,8 +65,6 @@ function logpdf(::BroadcastedNormal,
     assert_has_shape(x, broadcast_shapes_or_crash(mu, std);
                      msg="Shape of `x` does not agree with the sample space")
     z = (x .- mu) ./ std
-    var = std .* std
-    diff = x .- mu
     sum(- (abs2.(z) .+ log(2π)) / 2 .- log.(std))
 end
 
@@ -85,10 +83,29 @@ function logpdf_grad(::BroadcastedNormal,
     assert_has_shape(x, broadcast_shapes_or_crash(mu, std);
                      msg="Shape of `x` does not agree with the sample space")
     z = (x .- mu) ./ std
-    deriv_x = sum(- z ./ std)
+    # Keep each gradient elementwise here; `unbroadcast_for_arg` below reduces it
+    # to the shape of the argument it belongs to.
+    deriv_x = - z ./ std
     deriv_mu = -deriv_x
-    deriv_std = sum(-1. ./ std .+ abs2.(z) ./ std)
-    (deriv_x, deriv_mu, deriv_std)
+    # `abs2` must be dotted: `z` is an array whenever any argument is an array,
+    # and `abs2` has no method for arrays.
+    deriv_std = -1. ./ std .+ abs2.(z) ./ std
+    (unbroadcast_for_arg(x, deriv_x),
+     unbroadcast_for_arg(mu, deriv_mu),
+     unbroadcast_for_arg(std, deriv_std))
+end
+
+"""
+    unbroadcast_for_arg(arg, grad)
+
+Reduce `grad` to the shape of `arg`.
+
+- `arg::Real`: return `sum(grad)`.
+- zero-dimensional `arg` with a scalar `grad`: return `fill(grad)`, a
+  zero-dimensional array.
+- array `arg` with array `grad`: return `grad` itself when the sizes already
+  match, otherwise the result of `unbroadcast_grad(size(arg), grad)`.
+"""
+unbroadcast_for_arg(::Real, grad) = sum(grad)
+# Accept any real element type, not only `Float64`, for a zero-dimensional `arg`.
+unbroadcast_for_arg(::AbstractArray{<:Real, 0}, grad::Real) = fill(grad)
+function unbroadcast_for_arg(
+    arg::AbstractArray{<:Real, N}, grad::AbstractArray{T}
+)::AbstractArray{T, N} where {N,T}
+    size(arg) == size(grad) ? grad : unbroadcast_grad(size(arg), grad)
+end
+
+"""
+    unbroadcast_grad(old_shape, grad)
+
+Sum `grad` over every dimension that either lies beyond `length(old_shape)` or
+has extent 1 in `old_shape` but extent greater than 1 in `grad`, then drop the
+trailing dimensions so the result has `length(old_shape)` dimensions.
+"""
+function unbroadcast_grad(
+    old_shape::NTuple{l_old, Int}, grad::AbstractArray{T, l_new}
+) where {T, l_old, l_new}
+    @assert l_new >= l_old
+    grad_shape = size(grad)
+    # Short-circuiting `||` keeps `old_shape[i]` from being indexed past `l_old`.
+    is_summed(i) = i > l_old || (old_shape[i] == 1 && grad_shape[i] > 1)
+    summed_dims = [i for i in 1:l_new if is_summed(i)]
+    reduced = sum(grad; dims=summed_dims)
+    trailing_dims = Tuple(l_old+1:l_new)
+    return dropdims(reduced; dims=trailing_dims)::AbstractArray{T, l_old}
 end
 
 random(::Normal, mu::Real, std::Real) = mu + std * randn()

diff --git a/test/modeling_library/distributions.jl b/test/modeling_library/distributions.jl
@@ -126,9 +126,9 @@ end
     f = (x, mu, std) -> logpdf(broadcasted_normal, x, mu, std)
     args = (fill(0.4), fill(0.2), fill(0.3))
     actual = logpdf_grad(broadcasted_normal, args...)
-    @test isapprox(actual[1], finite_diff(f, args, 1, dx; broadcast=true))
-    @test isapprox(actual[2], finite_diff(f, args, 2, dx; broadcast=true))
-    @test isapprox(actual[3], finite_diff(f, args, 3, dx; broadcast=true))
 pos_args[i] = copy(args[i]) .+ dx 
 neg_args[i] = copy(args[i]) .- dx 
 pos_args[i] = copy(args[i]) .+ dx 
 neg_args[i] = copy(args[i]) .- dx 
+    @test isapprox(actual[1][], finite_diff(f, args, 1, dx))
+    @test isapprox(actual[2][], finite_diff(f, args, 2, dx))
+    @test isapprox(actual[3][], finite_diff(f, args, 3, dx))
 end
 
 @testset "array normal (trivially broadcasted: all args have same shape)" begin