Merge branch 'fix_infer_dicttype' of /~https://github.com/reactivebayes…

…/RxInfer.jl into fix_infer_dicttype
ReactiveBayes · Feb 22, 2024 · 9cd0d84 · 9cd0d84
2 parents 45b1d6e + 0dca5e2
commit 9cd0d84
Show file tree

Hide file tree

Showing 5 changed files with 147 additions and 8 deletions.
diff --git a/.github/workflows/CI.yml b/.github/workflows/CI.yml
@@ -57,7 +57,7 @@ jobs:
         arch:
           - x64
     steps:
-      - uses: actions/checkout@v2
+      - uses: actions/checkout@v4
       - uses: julia-actions/setup-julia@v1
       - uses: julia-actions/cache@v1
       - uses: julia-actions/julia-buildpkg@v1

diff --git a/Makefile b/Makefile
@@ -37,7 +37,7 @@ format: scripts_init ## Code formating run
 
 examples_init:
 	$(RM) $(EXAMPLES_MANIFEST_FILE)
-	julia --startup-file=no --project=examples/ -e 'using Pkg; Pkg.develop(PackageSpec(path=pwd())); Pkg.instantiate(); Pkg.precompile();'
+	julia --startup-file=no --project=examples/ -e 'using Pkg; Pkg.develop(PackageSpec(path=pwd())); Pkg.instantiate(); Pkg.build(); Pkg.precompile();'
 
 dev_examples_init:
 	$(RM) $(EXAMPLES_MANIFEST_FILE)

diff --git a/docs/make.jl b/docs/make.jl
@@ -50,9 +50,7 @@ end
 
 # Create an array of pages for each category
 ExamplesCategoriesPages = map(collect(pairs(ExamplesCategories))) do (label, category)
-    return label => (title = category.title, pages = [
-        "Overview" => joinpath("examples", string(label), "overview.md")
-    ])
+    return label => (title = category.title, pages = ["Overview" => joinpath("examples", string(label), "overview.md")])
 end |> NamedTuple
 
 # The `pages` argument in the `makedocs` needs only a short path, so we ignore the full path
@@ -69,6 +67,7 @@ end
 foreach(vcat(ExamplesOverviewPath, ExamplesCategoriesOverviewPaths)) do path
     if !isfile(path)
         @warn "`$(path)` does not exist. Generating an empty overview. Use the `make examples` command to generate the overview and all examples."
+        mkpath(dirname(path))
         open(path, "w") do f
             write(f, "The overview is missing. Use the `make examples` command to generate the overview and all examples.")
         end
@@ -117,6 +116,7 @@ makedocs(;
             "Meta specification"        => "manuals/meta-specification.md",
             "Inference specification"   => ["Overview" => "manuals/inference/overview.md", "Static vs Streamline inference" => "manuals/inference/infer.md", "Inference results postprocessing" => "manuals/inference/postprocess.md", "Manual inference specification" => "manuals/inference/manual.md"],
             "Inference customization"   => ["Defining a custom node and rules" => "manuals/custom-node.md"],
+            "Messages initialization"   => "manuals/understanding-why-to-initialize-messages.md",
             "Debugging"                 => "manuals/debugging.md",
             "Delta node"                => "manuals/delta-node.md"
         ],
@@ -131,10 +131,10 @@ makedocs(;
             ExamplesPages...
         ],
         "Contributing" => [
-            "Overview" => "contributing/overview.md", 
+            "Overview" => "contributing/overview.md",
             "Contributing to the documentation" => "contributing/new-documentation.md",
-            "Contributing to the dependencies" => "contributing/new-package.md", 
-            "Contributing to the examples" => "contributing/new-example.md", 
+            "Contributing to the dependencies" => "contributing/new-package.md",
+            "Contributing to the examples" => "contributing/new-example.md",
             "Publishing a new release" => "contributing/new-release.md"
         ]
     ]

diff --git a/docs/src/assets/img/linear_regresion_model.png b/docs/src/assets/img/linear_regresion_model.png
diff --git a/docs/src/manuals/understanding-why-to-initialize-messages.md b/docs/src/manuals/understanding-why-to-initialize-messages.md
@@ -0,0 +1,139 @@
+# Understating why we need to initialize messages in RxInfer
+
+In certain models, after completing the model specification step and moving on to execute the inference procedure, you may encounter an error prompting you to _initialize required marginals and messages_. Understanding why this step is necessary can be perplexing. This tutorial is designed to delve into the intuition behind model initialization using a practical example.
+
+
+## Part 1. Framing the problem 
+
+John has recently acquired a new car and is keenly interested in its `fuel consumption` rate. He holds the belief that this rate follows a linear relationship with the variable `speed`. To validate this hypothesis, he plans to conduct tests by driving his car on the urban roads close to his home, recording both the `fuel consumption` and `speed` data. To ascertain the fuel consumption rate, John has opted for Bayesian linear regression as his analytical method.
+
+```@example init-tutorial
+using Random, Plots, StableRNGs
+
+function generate_data(a, b, v, nr_samples; rng = StableRNG(1234))
+    x = float.(collect(1:nr_samples))
+    y = a .* x .+ b .+ randn(rng, nr_samples) .* sqrt(v)
+    return x, y
+end;
+
+# For demonstration purposes we generate some fake data 
+x_data, y_data = generate_data(0.5, 25.0, 1.0, 250)
+
+scatter(x_data, y_data, title = "Dataset (City road)", legend=false)
+xlabel!("Speed")
+ylabel!("Fuel consumption")
+```
+
+
+### Univariate regression with known noise
+
+First, he drives the car on a urban road. John enjoys driving on the well-built, wide, and flat urban roads. Urban roads also offer the advantage of precise fuel consumption measurement with minimal noise. Therefore John models the fuel consumption $y_n\in\mathbb{R}$ as a normal distribution and treats $x_n$ as a fixed hyper-parameter:
+
+$$\begin{aligned}
+p(y_n \mid a, b) = \mathcal{N}(y_n \mid a x_n + b , 1)
+\end{aligned}$$
+
+The recorded speed is denoted as $x_n \in \mathbb{R}$ and the recorded fuel consumption as $y_n \in \mathbb{R}$. Prior beliefs on $a$ and $b$ are informed by the vehicle manual.
+
+$$\begin{aligned}
+    p(a) &= \mathcal{N}(a \mid m_a, v_a) \\
+    p(b) &= \mathcal{N}(b \mid m_b, v_b) 
+\end{aligned}$$
+
+Together they form the probabilistic model
+$$p(y, a, b) = p(a)p(b) \prod_{N=1}^N p(y_n \mid a, b),$$
+where the goal is to infer the posterior distributions $p(a \mid y)$ and $p(b\mid y)$.
+
+In order to estimate the two parameters with the recorded data, he uses a `RxInfer.jl` to create the above described model.
+
+```@example init-tutorial
+using RxInfer
+
+@model function linear_regression(nr_samples)
+    a ~ Normal(mean = 0.0, variance = 1.0)
+    b ~ Normal(mean = 0.0, variance = 100.0)
+    
+    x = datavar(Float64, nr_samples)
+    y = datavar(Float64, nr_samples)
+    
+    y .~ Normal(mean = a .* x .+ b, variance = 1.0)
+end
+```
+
+Delighted with the convenience offered by the package's inference function ([`infer`](@ref)), he appreciates the time saved from building everything from the ground up. This feature allows him to effortlessly obtain the desired results for his specific road. Upon consulting the documentation, he proceeds to run the inference function.
+
+```julia
+results = infer(
+    model        = linear_regression(length(x_data)), 
+    data         = (y = y_data, x = x_data), 
+    returnvars   = (a = KeepLast(), b = KeepLast()),
+    iterations   = 20,
+    free_energy  = true
+)
+```
+
+Oeps! Exception?
+
+```
+exception =
+│    Variables [ a, b ] have not been updated after an update event. 
+│    Therefore, make sure to initialize all required marginals and messages. See `initmarginals` and `initmessages` keyword arguments for the inference function. 
+│    See the function documentation for detailed information regarding the initialization.
+```
+
+After running the inference procedure an error appears, which prompts him to _initialize all required messages and marginals_. Now, John is left pondering the reason behind this requirement. Why is it necessary? Should he indeed initialize all messages and marginals? And if so, how might this impact the inference procedure?
+
+## Part 2. Why and What to initialize
+
+Before delving too deeply into the details, it's important to understand that RxInfer constructs a factorized representation of your model using a Forney Style Factor Graph (FFG). In this structure, inference is executed through message passing.
+
+A challenge arises when RxInfer generates the FFG representation with structural loops in certain parts of the graph. These loops indicate that a message or marginal within the loop depends not only on its prior but also on itself. Consequently, proper initialization is crucial for initiating the inference process. Two general rules of thumb guide this initialization, although the intricate details are beyond the scope of this tutorial:
+
+1.	Initiate as few messages/marginals as possible when dealing with a loop structure, it will be more efficient and accurate.
+2.	Prioritize initializing marginals over messages.
+
+**How to identify and handle the loops?**
+
+Identifying loops is currently a manual process, as the current version of RxInfer doesn't support a graphical representation of the created graph. As such, the manual process involves:
+
+1.	Deriving the graphical representation of the model,
+2.	Identifying loops and the messages or marginals that need to be initialized within the loop.
+
+However, once you receive the message `Variables [x, y, z] have not been updated after an update event`, it is a good indication that there is a loop in your model. If you see this message, you should check your model for loops and try to initialize the messages and/or marginals that are part of the loop.
+
+### Deriving FFG and identifying the loops
+
+John proceeds to derive the FFG for his problem where he identifies where the loops are:
+
+![Addons_messages](../assets/img/linear_regresion_model.png)
+
+He does note that there is a loop in his model, namely all $a$ and $b$ variables are connected over all observations, therefore he needs to initialize one of the messages and run multiple iterations for the loopy belief propagation algorithm. It is worth noting that loopy belief propagation is not guaranteed to converge in general and might be highly influenced by the choice of the initial messages in the `initmessages` argument. He is going to evaluate the convergency performance of the algorithm with the `free_energy = true` option:
+
+
+```@example init-tutorial
+results = infer(
+    model        = linear_regression(length(x_data)), 
+    data         = (y = y_data, x = x_data), 
+    initmessages = (b = NormalMeanVariance(0.0, 100.0), ), 
+    returnvars   = (a = KeepLast(), b = KeepLast()),
+    iterations   = 20,
+    free_energy  = true
+)
+
+# drop first iteration, which is influenced by the `initmessages`
+plot(2:20, results.free_energy[2:end], title="Free energy", xlabel="Iteration", ylabel="Free energy [nats]", legend=false)
+```
+
+Now the inference runs without the error! 🎉
+
+```@example init-tutorial
+as = rand(results.posteriors[:a], 100)
+bs = rand(results.posteriors[:b], 100)
+p = scatter(x_data, y_data, title = "Linear regression with more noise", legend=false)
+xlabel!("Speed")
+ylabel!("Fuel consumption")
+for (a, b) in zip(as, bs)
+    global p = plot!(p, x_data, a .* x_data .+ b, alpha = 0.05, color = :red)
+end
+plot(p, size = (900, 400))
+```