Commit 550867a

Merge pull request #30 from TensorBFS/jg/sampling
Improve the performance of sampling
2 parents a3c3181 + a55eabc commit 550867a

File tree

4 files changed, +114 −79 lines changed

src/sampling.jl

Lines changed: 49 additions & 23 deletions
@@ -10,7 +10,7 @@ The sampled configurations are stored in `samples`, which is a vector of vector.
 The `setmask` is a boolean indicator to denote whether the sampling process of a variable is complete.
 """
 struct Samples{L}
-    samples::Vector{Vector{Int}}
+    samples::Matrix{Int}  # size is nvars × nsample
     labels::Vector{L}
     setmask::BitVector
 end
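
Note: the struct change above swaps a vector of per-sample vectors for a single nvars × nsample matrix. A minimal sketch (illustration only, not part of this commit) of why the column layout helps in column-major Julia arrays:

    nvars, nsample = 8, 10_000
    samples = zeros(Int, nvars, nsample)   # was: 10_000 separate length-8 vectors
    samples[[3, 5], 1] .= (1, 0)           # write variables 3 and 5 of sample 1
    col = view(samples, :, 1)              # one whole configuration, no copy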
@@ -23,7 +23,7 @@ function setmask!(samples::Samples, eliminated_variables)
     return samples
 end

-idx4labels(totalset, labels) = map(v->findfirst(==(v), totalset), labels)
+idx4labels(totalset, labels)::Vector{Int} = map(v->findfirst(==(v), totalset), labels)

 """
 $(TYPEDSIGNATURES)
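
Note on the new ::Vector{Int} return annotation (my reading; the commit does not spell it out): findfirst returns Union{Nothing, Int}, so the unannotated map infers Vector{Union{Nothing, Int}}; the annotation converts and asserts to Vector{Int}, keeping downstream indexing type stable. A toy call for illustration:

    idx4labels(totalset, labels)::Vector{Int} = map(v->findfirst(==(v), totalset), labels)
    idx4labels([:a, :b, :c], [:c, :a])   # == [3, 1]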
@@ -41,32 +41,52 @@ function backward_sampling!(ixs, @nospecialize(xs::Tuple), iy, @nospecialize(y),
     setmask!(samples, eliminated_variables)

     # the contraction code to get probability
-    newiy = eliminated_variables
-    iy_in_sample = idx4labels(samples.labels, iy)
-    slice_y_dim = collect(1:length(iy))
     newixs = map(ix->setdiff(ix, iy), ixs)
     ix_in_sample = map(ix->idx4labels(samples.labels, ix ∩ iy), ixs)
     slice_xs_dim = map(ix->idx4labels(ix, ix ∩ iy), ixs)
-    code = DynamicEinCode(newixs, newiy)
+
+    # relabel and compute probabilities
+    uniquelabels = unique!(vcat(ixs..., iy))
+    labelmap = Dict(zip(uniquelabels, 1:length(uniquelabels)))
+    batchdim = length(labelmap) + 1
+    newnewixs = [Int[getindex.(Ref(labelmap), ix)..., batchdim] for ix in newixs]
+    newnewiy = Int[getindex.(Ref(labelmap), eliminated_variables)..., batchdim]
+    newnewxs = [get_slice(x, dimx, samples.samples[ixloc, :]) for (x, dimx, ixloc) in zip(xs, slice_xs_dim, ix_in_sample)]
+    code = DynamicEinCode(newnewixs, newnewiy)
+    probabilities = code(newnewxs...)

     totalset = CartesianIndices((map(x->size_dict[x], eliminated_variables)...,))
-    for (i, sample) in enumerate(samples.samples)
-        newxs = [get_slice(x, dimx, sample[ixloc]) for (x, dimx, ixloc) in zip(xs, slice_xs_dim, ix_in_sample)]
-        newy = get_element(y, slice_y_dim, sample[iy_in_sample])
-        probabilities = einsum(code, (newxs...,), size_dict) / newy
-        config = StatsBase.sample(totalset, Weights(vec(probabilities)))
-        # update the samples
-        samples.samples[i][eliminated_locs] .= config.I .- 1
+    for i=axes(samples.samples, 2)
+        config = StatsBase.sample(totalset, Weights(vec(selectdim(probabilities, ndims(probabilities), i))))
+        # update the samples
+        samples.samples[eliminated_locs, i] .= config.I .- 1
     end
     return samples
 end

 # type unstable
-function get_slice(x, dim, config)
-    asarray(x[[i ∈ dim ? config[findfirst(==(i), dim)]+1 : Colon() for i in 1:ndims(x)]...], x)
+function get_slice(x::AbstractArray{T}, slicedim, configs::AbstractMatrix) where T
+    outdim = setdiff(1:ndims(x), slicedim)
+    res = similar(x, [size(x, d) for d in outdim]..., size(configs, 2))
+    return get_slice!(res, x, outdim, slicedim, configs)
 end
-function get_element(x, dim, config)
-    x[[config[findfirst(==(i), dim)]+1 for i in 1:ndims(x)]...]
+
+function get_slice!(res, x::AbstractArray{T}, outdim, slicedim, configs::AbstractMatrix) where T
+    xstrides = strides(x)
+    @inbounds for ci in CartesianIndices(res)
+        idx = 1
+        # the output dimension part
+        for (dim, k) in zip(outdim, ci.I)
+            idx += (k-1) * xstrides[dim]
+        end
+        # the sliced part
+        batchidx = ci.I[end]
+        for (dim, k) in zip(slicedim, view(configs, :, batchidx))
+            idx += k * xstrides[dim]
+        end
+        res[ci] = x[idx]
+    end
+    return res
 end

 """
@@ -79,7 +99,7 @@ Returns a vector of vector, each element being a configurations defined on `get_
 * `tn` is the tensor network model.
 * `n` is the number of samples to be returned.
 """
-function sample(tn::TensorNetworkModel, n::Int; usecuda = false)::Vector{Vector{Int}}
+function sample(tn::TensorNetworkModel, n::Int; usecuda = false)::AbstractMatrix{Int}
     # generate tropical tensors with its elements being log(p).
     xs = adapt_tensors(tn; usecuda, rescale = false)
     # infer size from the contraction code and the input tensors `xs`, returns a label-size dictionary.
@@ -93,21 +113,27 @@ function sample(tn::TensorNetworkModel, n::Int; usecuda = false)::Vector{Vector{
     idx = map(l->findfirst(==(l), labels), iy)
     setmask[idx] .= true
     indices = StatsBase.sample(CartesianIndices(size(cache.content)), Weights(normalize!(vec(LinearAlgebra.normalize!(cache.content)))), n)
-    configs = map(indices) do ind
-        c=zeros(Int, length(labels))
-        c[idx] .= ind.I .- 1
-        c
+    configs = zeros(Int, length(labels), n)
+    for i=1:n
+        configs[idx, i] .= indices[i].I .- 1
     end
     samples = Samples(configs, labels, setmask)
     # back-propagate
     generate_samples(tn.code, cache, samples, size_dict)
+    # set evidence variables
+    for (k, v) in tn.fixedvertices
+        idx = findfirst(==(k), labels)
+        samples.samples[idx, :] .= v
+    end
     return samples.samples
 end

 function generate_samples(code::NestedEinsum, cache::CacheTree{T}, samples, size_dict::Dict) where {T}
     if !OMEinsum.isleaf(code)
         xs = ntuple(i -> cache.siblings[i].content, length(cache.siblings))
         backward_sampling!(OMEinsum.getixs(code.eins), xs, OMEinsum.getiy(code.eins), cache.content, samples, size_dict)
-        generate_samples.(code.args, cache.siblings, Ref(samples), Ref(size_dict))
+        for (arg, sib) in zip(code.args, cache.siblings)
+            generate_samples(arg, sib, samples, size_dict)
+        end
     end
 end
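
Note: the essence of the speedup in backward_sampling! is replacing n tiny per-sample contractions with one batched einsum whose output carries a trailing batch leg. A toy sketch (my example, not from the commit) of that idea using the same OMEinsum/StatsBase API:

    using OMEinsum, StatsBase

    A = rand(2, 2)                # factor over variables (1, 2)
    B = rand(2, 2)                # factor over variables (2, 3)
    nsample = 4
    fixed3 = rand(0:1, nsample)   # variable 3 already sampled, 0-based

    # slice B on variable 3 once for all samples; columns form the batch leg
    Bsliced = hcat([B[:, c + 1] for c in fixed3]...)   # size 2 × nsample

    # labels: A -> (1, 2), Bsliced -> (2, batch), output -> (1, batch)
    code = DynamicEinCode([[1, 2], [2, 4]], [1, 4])
    probs = code(A, Bsliced)      # conditional weights of variable 1, per sample

    # draw variable 1 for every sample from its (unnormalized) conditional
    draws = [StatsBase.sample(0:1, Weights(probs[:, i])) for i in 1:nsample]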

test/mmap.jl

Lines changed: 1 addition & 55 deletions
@@ -28,58 +28,4 @@ end
     @debug(mmap3)
     logp, config = most_probable_config(mmap3)
     @test log_probability(mmap3, config) ≈ logp
-end
-
-@testset "sampling" begin
-    instance = TensorInference.read_instance_from_string("""MARKOV
-8
-2 2 2 2 2 2 2 2
-8
-1 0
-2 1 0
-1 2
-2 3 2
-2 4 2
-3 5 3 1
-2 6 5
-3 7 5 4
-
-2
-0.01
-0.99
-
-4
-0.05 0.01
-0.95 0.99
-
-2
-0.5
-0.5
-
-4
-0.1 0.01
-0.9 0.99
-
-4
-0.6 0.3
-0.4 0.7
-
-8
-1 1 1 0
-0 0 0 1
-
-4
-0.98 0.05
-0.02 0.95
-
-8
-0.9 0.7 0.8 0.1
-0.1 0.3 0.2 0.9
-""")
-    n = 10000
-    tnet = TensorNetworkModel(instance)
-    samples = sample(tnet, n)
-    mars = getindex.(marginals(tnet), 2)
-    mars_sample = [count(s->s[k]==(1), samples) for k=1:8] ./ n
-    @test isapprox(mars, mars_sample, atol=0.05)
-end
+end

test/runtests.jl

Lines changed: 1 addition & 1 deletion
@@ -1,7 +1,7 @@
 using Test, TensorInference, Documenter, Pkg, Artifacts

 import Pkg;
-Pkg.ensure_artifact_installed("uai2014", "Artifacts.toml");
+Pkg.ensure_artifact_installed("uai2014", joinpath(@__DIR__, "Artifacts.toml"));

 include("utils.jl")

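Note: the fix makes the artifact lookup independent of the working directory — a bare "Artifacts.toml" resolves against pwd(), so it only worked when the suite was launched from test/. A sketch of the resolved behavior (the artifact_path lookup is my addition and assumes the entry exists):

    using Pkg, Artifacts

    artifacts_toml = joinpath(@__DIR__, "Artifacts.toml")   # anchored at this file
    Pkg.ensure_artifact_installed("uai2014", artifacts_toml)
    data_dir = Artifacts.artifact_path(Artifacts.artifact_hash("uai2014", artifacts_toml))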
test/sampling.jl

Lines changed: 63 additions & 0 deletions
@@ -0,0 +1,63 @@
+using TensorInference, Test
+
+@testset "sampling" begin
+    instance = TensorInference.read_instance_from_string("""MARKOV
+8
+2 2 2 2 2 2 2 2
+8
+1 0
+2 1 0
+1 2
+2 3 2
+2 4 2
+3 5 3 1
+2 6 5
+3 7 5 4
+
+2
+0.01
+0.99
+
+4
+0.05 0.01
+0.95 0.99
+
+2
+0.5
+0.5
+
+4
+0.1 0.01
+0.9 0.99
+
+4
+0.6 0.3
+0.4 0.7
+
+8
+1 1 1 0
+0 0 0 1
+
+4
+0.98 0.05
+0.02 0.95
+
+8
+0.9 0.7 0.8 0.1
+0.1 0.3 0.2 0.9
+""")
+    n = 10000
+    tnet = TensorNetworkModel(instance)
+    samples = sample(tnet, n)
+    mars = getindex.(marginals(tnet), 2)
+    mars_sample = [count(i->samples[k, i]==(1), axes(samples, 2)) for k=1:8] ./ n
+    @test isapprox(mars, mars_sample, atol=0.05)
+
+    # fix the evidence
+    set_evidence!(instance, 7=>1)
+    tnet = TensorNetworkModel(instance)
+    samples = sample(tnet, n)
+    mars = getindex.(marginals(tnet), 1)
+    mars_sample = [count(i->samples[k, i]==(0), axes(samples, 2)) for k=1:8] ./ n
+    @test isapprox([mars[1:6]..., mars[8]], [mars_sample[1:6]..., mars_sample[8]], atol=0.05)
+end
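
Note: a hypothetical follow-up to the test above — with the matrix layout, the empirical marginals used in the assertions reduce to row-wise means:

    using Statistics
    p1 = vec(mean(samples .== 1; dims=2))   # empirical P(x_k = 1) for every variable k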
