@@ -12,115 +12,6 @@ function adapt_tensors(code, tensors, evidence; usecuda, rescale)
     end
 end
 
-# ######### Inference by back propagation ############
-# `CacheTree` stores intermediate `NestedEinsum` contraction results.
-# It is a tree structure that is isomorphic to the contraction tree:
-# `content` is the cached intermediate contraction result, and
-# `children` are the children of the current node, i.e. the tensors that are contracted to get `content`.
-mutable struct CacheTree{T}
-    content::AbstractArray{T}
-    const children::Vector{CacheTree{T}}
-end
-
-function cached_einsum(se::SlicedEinsum, @nospecialize(xs), size_dict)
-    # slicing is not supported yet.
-    if length(se.slicing) != 0
-        @warn "Slicing is not supported for caching, got nslices = $(length(se.slicing))! Fallback to `NestedEinsum`."
-    end
-    return cached_einsum(se.eins, xs, size_dict)
-end
-
-# recursively contract and cache a tensor network
-function cached_einsum(code::NestedEinsum, @nospecialize(xs), size_dict)
-    if OMEinsum.isleaf(code)
-        # For a leaf node, cache the input tensor
-        y = xs[code.tensorindex]
-        return CacheTree(y, CacheTree{eltype(y)}[])
-    else
-        # For a non-leaf node, compute the einsum and cache the contraction result
-        caches = [cached_einsum(arg, xs, size_dict) for arg in code.args]
-        # `einsum` evaluates the einsum contraction:
-        # its 1st argument is the contraction pattern,
-        # its 2nd argument is a tuple of input tensors,
-        # its 3rd argument is the size dictionary (label as the key, size as the value).
-        y = einsum(code.eins, ntuple(i -> caches[i].content, length(caches)), size_dict)
-        return CacheTree(y, caches)
-    end
-end
-
-# compute the gradient tree by back propagation
-function generate_gradient_tree(se::SlicedEinsum, cache::CacheTree{T}, dy::AbstractArray{T}, size_dict::Dict) where {T}
-    if length(se.slicing) != 0
-        @warn "Slicing is not supported for generating masked tree! Fallback to `NestedEinsum`."
-    end
-    return generate_gradient_tree(se.eins, cache, dy, size_dict)
-end
-
-# recursively compute the gradients and store them in a tree;
-# also known as the back-propagation algorithm.
-function generate_gradient_tree(code::NestedEinsum, cache::CacheTree{T}, dy::AbstractArray{T}, size_dict::Dict) where {T}
-    if OMEinsum.isleaf(code)
-        return CacheTree(dy, CacheTree{T}[])
-    else
-        xs = ntuple(i -> cache.children[i].content, length(cache.children))
-        # `einsum_grad` is the back-propagation rule for the einsum function.
-        # If the forward pass is `y = einsum(EinCode(inputs_labels, output_labels), (A, B, ...), size_dict)`,
-        # then the back-propagation pass is
-        # ```
-        # A̅ = einsum_grad(inputs_labels, (A, B, ...), output_labels, size_dict, y̅, 1)
-        # B̅ = einsum_grad(inputs_labels, (A, B, ...), output_labels, size_dict, y̅, 2)
-        # ...
-        # ```
-        # Let `L` be the loss; then `y̅ := ∂L/∂y`, `A̅ := ∂L/∂A`, ...
-        dxs = einsum_backward_rule(code.eins, xs, cache.content, size_dict, dy)
-        return CacheTree(dy, generate_gradient_tree.(code.args, cache.children, dxs, Ref(size_dict)))
-    end
-end
-
-# a unified interface of the backward rules for real numbers and tropical numbers
-function einsum_backward_rule(eins, xs::NTuple{M, AbstractArray{<:Real}} where {M}, y, size_dict, dy)
-    return ntuple(i -> OMEinsum.einsum_grad(OMEinsum.getixs(eins), xs, OMEinsum.getiy(eins), size_dict, dy, i), length(xs))
-end
-
-# the main function for generating the gradient tree.
-function gradient_tree(code, xs)
-    # infer the sizes from the contraction code and the input tensors `xs`; returns a label-size dictionary.
-    size_dict = OMEinsum.get_size_dict!(getixsv(code), xs, Dict{Int, Int}())
-    # forward compute and cache intermediate results.
-    cache = cached_einsum(code, xs, size_dict)
-    # initialize `y̅` as `1`. Note we always start from `L̅ := 1`.
-    dy = match_arraytype(typeof(cache.content), ones(eltype(cache.content), size(cache.content)))
-    # back-propagate
-    return copy(cache.content), generate_gradient_tree(code, cache, dy, size_dict)
-end
-
-# evaluate the cost and the gradients of the leaves
-function cost_and_gradient(code, xs)
-    cost, tree = gradient_tree(code, xs)
-    # extract the gradients on the leaves (i.e. the input tensors).
-    return cost, extract_leaves(code, tree)
-end
-
-# since slicing is not supported, we forward it to NestedEinsum.
-extract_leaves(code::SlicedEinsum, cache::CacheTree) = extract_leaves(code.eins, cache)
-
-# extract gradients on leaf nodes.
-function extract_leaves(code::NestedEinsum, cache::CacheTree)
-    res = Vector{Any}(undef, length(getixsv(code)))
-    return extract_leaves!(code, cache, res)
-end
-
-function extract_leaves!(code, cache, res)
-    if OMEinsum.isleaf(code)
-        # extract the cached gradient on this leaf
-        res[code.tensorindex] = cache.content
-    else
-        # recurse deeper
-        extract_leaves!.(code.args, cache.children, Ref(res))
-    end
-    return res
-end
-
 """
 $(TYPEDSIGNATURES)
 
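Note on the deleted block above: it implemented reverse-mode differentiation over the cached contraction tree, seeding `y̅` with ones at the root and pushing gradients down to the leaf tensors. Below is a minimal sketch (not part of this commit) of the single-node rule that `einsum_backward_rule` applied at every internal node; the small contraction, the tensors `A`, `B`, and the integer labels are made up for illustration, and only calls that already appear in the deleted code are used.

```
using OMEinsum

A, B = randn(2, 3), randn(3, 4)
code = EinCode([[1, 2], [2, 3]], [1, 3])    # y[i, k] = Σⱼ A[i, j] * B[j, k]
size_dict = OMEinsum.get_size_dict!(OMEinsum.getixsv(code), (A, B), Dict{Int, Int}())

y  = einsum(code, (A, B), size_dict)        # forward pass (what `cached_einsum` stores per node)
dy = ones(eltype(y), size(y))               # seed y̅ := ∂L/∂y = 1, i.e. L = sum(y)

# the per-input backward rule, as used by the removed `einsum_backward_rule`
dA = OMEinsum.einsum_grad(OMEinsum.getixs(code), (A, B), OMEinsum.getiy(code), size_dict, dy, 1)
dB = OMEinsum.einsum_grad(OMEinsum.getixs(code), (A, B), OMEinsum.getiy(code), size_dict, dy, 2)
```

Applied recursively from the root, these per-leaf gradients are what `extract_leaves` collected and what the `marginals` hunk below consumes via `cost_and_gradient`.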
@@ -186,7 +77,7 @@ probabilities of the queried variables, represented by tensors.
 """
 function marginals(tn::TensorNetworkModel; usecuda = false, rescale = true)::Dict{Vector{Int}}
     # sometimes the cost can overflow; then we need to rescale the tensors during contraction.
-    cost, grads = cost_and_gradient(tn.code, adapt_tensors(tn; usecuda, rescale))
+    cost, grads = cost_and_gradient(tn.code, (adapt_tensors(tn; usecuda, rescale)...,))
     @debug "cost = $cost"
     ixs = OMEinsum.getixsv(tn.code)
     queryvars = ixs[tn.unity_tensors_idx]
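The only functional change in this hunk is that the tensor list returned by `adapt_tensors` (a `Vector`) is now splatted into a `Tuple` before being handed to `cost_and_gradient`, presumably to match the argument type expected by the gradient routine that replaces the deleted in-package implementation. A tiny illustration of the splat idiom (the arrays are placeholders, not actual factors):

```
tensors = Any[randn(2, 2), randn(2)]   # a Vector of tensors, as `adapt_tensors` returns
xs = (tensors...,)                     # splat into a Tuple: (tensors[1], tensors[2])
```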