Skip to content

Commit e0cd6bc

Browse files
authored
Constant (scalar) variance in ConditionalMvNormal mapping (#42)
1 parent 0e64e9c commit e0cd6bc

File tree

2 files changed

+35
-2
lines changed

2 files changed

+35
-2
lines changed

src/cond_mvnormal.jl

+9
Original file line numberDiff line numberDiff line change
@@ -47,9 +47,18 @@ function condition(p::ConditionalMvNormal, z::AbstractMatrix)
4747
BatchMvNormal(μ,σ)
4848
end
4949

50+
# dispatches for different outputs from mappings
51+
# general case
5052
mean_var(x::Tuple) = x
53+
# single output assumes σ=1
5154
mean_var(x::AbstractVector) = (x, 1)
5255
mean_var(x::AbstractMatrix) = (x, fillsimilar(x,size(x,2),1))
56+
# fixed scalar variance
57+
# mean_var(x::Tuple{<:AbstractVector,<:Real}) = x; is already coverged
58+
function mean_var(x::Tuple{<:AbstractMatrix,<:Real})
59+
(μ,σ) = x
60+
(μ,fillsimilar(μ,size(μ,2),σ))
61+
end
5362

5463
# TODO: this should be moved to DistributionsAD
5564
Distributions.mean(p::TuringDiagMvNormal) = p.m

test/cond_mvnormal.jl

+26-2
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,6 @@
4646

4747
# BatchScalMvNormal
4848
m = SplitLayer(zlength, [xlength,1])
49-
d = MvNormal(zeros(Float32,xlength), 1f0)
5049
p = ConditionalMvNormal(m) |> gpu
5150

5251
res = condition(p, rand(zlength,batchsize)|>gpu)
@@ -70,7 +69,6 @@
7069

7170
# Unit variance
7271
m = Dense(zlength,xlength)
73-
d = MvNormal(zeros(Float32,xlength), 1f0)
7472
p = ConditionalMvNormal(m) |> gpu
7573

7674
res = condition(p, rand(zlength,batchsize)|>gpu)
@@ -90,4 +88,30 @@
9088

9189
f() = sum(rand(p,z))
9290
@test_nowarn Flux.gradient(f, ps)
91+
92+
93+
# Fixed scalar variance
94+
m = Dense(zlength,xlength)
95+
σ(x::AbstractVector) = 2
96+
σ(x::AbstractMatrix) = ones(Float32,size(x,2)) .* 2
97+
p = ConditionalMvNormal(SplitLayer(m,σ)) |> gpu
98+
99+
res = condition(p, rand(zlength,batchsize)|>gpu)
100+
μ = mean(res)
101+
σ2 = var(res)
102+
@test res isa ConditionalDists.BatchScalMvNormal
103+
@test size(μ) == (xlength,batchsize)
104+
@test size(σ2) == (xlength,batchsize)
105+
106+
x = rand(Float32, xlength, batchsize) |> gpu
107+
z = rand(Float32, zlength, batchsize) |> gpu
108+
loss() = sum(logpdf(p,x,z))
109+
ps = Flux.params(p)
110+
@test length(ps) == 2
111+
@test loss() isa Float32
112+
@test_nowarn gs = Flux.gradient(loss, ps)
113+
114+
f() = sum(rand(p,z))
115+
@test_nowarn Flux.gradient(f, ps)
116+
93117
end

0 commit comments

Comments (0)