
Commit b59947a

Merge remote-tracking branch 'origin/main' into breaking
2 parents ea9bb54 + 0299d7d

File tree

14 files changed: +546 −43 lines changed

HISTORY.md

Lines changed: 20 additions & 4 deletions
@@ -8,16 +8,32 @@ This is because the interface functions required have been shifted upstream to A
 
 In particular, you now only need to define the following functions:
 
-- AbstractMCMC.step(rng::Random.AbstractRNG, model::AbstractMCMC.LogDensityModel, ::MySampler; kwargs...) (and also a method with `state`, and the corresponding `step_warmup` methods if needed)
-- AbstractMCMC.getparams(::MySamplerState) -> Vector{<:Real}
-- AbstractMCMC.getstats(::MySamplerState) -> NamedTuple
-- AbstractMCMC.requires_unconstrained_space(::MySampler) -> Bool (default `true`)
+- `AbstractMCMC.step(rng::Random.AbstractRNG, model::AbstractMCMC.LogDensityModel, ::MySampler; kwargs...)` (and also a method with `state`, and the corresponding `step_warmup` methods if needed)
+- `AbstractMCMC.getparams(::MySamplerState)` -> Vector{<:Real}
+- `AbstractMCMC.getstats(::MySamplerState)` -> NamedTuple
+- `AbstractMCMC.requires_unconstrained_space(::MySampler)` -> Bool (default `true`)
 
 This means that you only need to depend on AbstractMCMC.jl.
 As long as the above functions are defined correctly, Turing will be able to use your external sampler.
 
 The `Turing.Inference.isgibbscomponent(::MySampler)` interface function still exists, but in this version the default has been changed to `true`, so you should not need to overload this.
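To illustrate, here is a minimal sketch of a hypothetical external sampler implementing the interface listed above. `MySampler` and `MySamplerState` are placeholder names, and the random-walk "proposal" is a stand-in rather than a correct MCMC kernel (its draws do not target the model's posterior):

```julia
using AbstractMCMC, LogDensityProblems, Random

struct MySampler <: AbstractMCMC.AbstractSampler end
struct MySamplerState
    params::Vector{Float64}
end

# First step: no previous state is available yet.
function AbstractMCMC.step(
    rng::Random.AbstractRNG, model::AbstractMCMC.LogDensityModel, ::MySampler; kwargs...
)
    d = LogDensityProblems.dimension(model.logdensity)
    state = MySamplerState(randn(rng, d))
    return state, state
end

# Subsequent steps: receive and update the previous state. A real sampler would
# evaluate `LogDensityProblems.logdensity(model.logdensity, ...)` here; this
# placeholder merely jitters the parameters.
function AbstractMCMC.step(
    rng::Random.AbstractRNG,
    model::AbstractMCMC.LogDensityModel,
    ::MySampler,
    state::MySamplerState;
    kwargs...,
)
    newstate = MySamplerState(state.params .+ 0.1 .* randn(rng, length(state.params)))
    return newstate, newstate
end

AbstractMCMC.getparams(state::MySamplerState) = state.params
AbstractMCMC.getstats(::MySamplerState) = (;)
AbstractMCMC.requires_unconstrained_space(::MySampler) = true
```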

+# 0.41.4
+
+Fixed a bug where the `check_model=false` keyword argument would not be respected when sampling with multiple threads or cores.
+
+# 0.41.3
+
+Fixed NUTS not correctly specifying the number of adaptation steps when calling `AdvancedHMC.initialize!` (this bug led to mass matrix adaptation not actually happening).
+
+# 0.41.2
+
+Add `GibbsConditional`, a "sampler" that can be used to provide analytically known conditional posteriors in a Gibbs sampler.
+
+In Gibbs sampling, some variables are sampled with a component sampler while holding the other variables conditioned to their current values. Usually one takes turns sampling, e.g., one variable with HMC and another with a particle sampler. However, sometimes the posterior distribution of one variable is known analytically, given the conditioned values of the other variables. `GibbsConditional` provides a way to implement these analytically known conditional posteriors and use them as component samplers for Gibbs. See the docstring of `GibbsConditional` for details.
+
+Note that `GibbsConditional` used to exist in Turing.jl until v0.36, at which point it was removed when the whole Gibbs sampler was rewritten. This reintroduces the same functionality, though with a slightly different interface.
+
 # 0.41.1
 
 The `ModeResult` struct returned by `maximum_a_posteriori` and `maximum_likelihood` can now be wrapped in `InitFromParams()`.

README.md

Lines changed: 26 additions & 17 deletions
@@ -1,6 +1,10 @@
-<p align="center"><img src="https://raw.githubusercontent.com/TuringLang/turinglang.github.io/refs/heads/main/assets/logo/turing-logo.svg" alt="Turing.jl logo" width="200" /></p>
-<h1 align="center">Turing.jl</h1>
-<p align="center"><i>Probabilistic programming and Bayesian inference in Julia</i></p>
+<p align="center">
+  <picture>
+    <source media="(prefers-color-scheme: dark)" srcset="https://turinglang.org/assets/logo/turing-logo-dark.svg">
+    <img src="https://turinglang.org/assets/logo/turing-logo-light.svg" alt="Turing.jl logo" width="300">
+  </picture>
+</p>
+<p align="center"><i>Bayesian inference with probabilistic programming</i></p>
 <p align="center">
 <a href="https://turinglang.org/"><img src="https://img.shields.io/badge/docs-tutorials-blue.svg" alt="Tutorials" /></a>
 <a href="https://turinglang.org/Turing.jl/stable"><img src="https://img.shields.io/badge/docs-API-blue.svg" alt="API docs" /></a>
@@ -9,9 +13,9 @@
 <a href="https://github.com/SciML/ColPrac"><img src="https://img.shields.io/badge/ColPrac-Contributor%27s%20Guide-blueviolet" alt="ColPrac: Contributor's Guide on Collaborative Practices for Community Packages" /></a>
 </p>
 
-## 🚀 Get started
+## Get started
 
-Install Julia (see [the official Julia website](https://julialang.org/install/); you will need at least Julia 1.10 for the latest version of Turing.jl).
+Install Julia (see [the official Julia website](https://julialang.org/install/); you will need at least Julia 1.10.8 for the latest version of Turing.jl).
 Then, launch a Julia REPL and run:
 
 ```julia
@@ -23,22 +27,29 @@ You can define models using the `@model` macro, and then perform Markov chain Mo
 ```julia
 julia> using Turing
 
-julia> @model function my_first_model(data)
-           mean ~ Normal(0, 1)
-           sd ~ truncated(Cauchy(0, 3); lower=0)
-           data ~ Normal(mean, sd)
+julia> @model function linear_regression(x)
+           # Priors
+           α ~ Normal(0, 1)
+           β ~ Normal(0, 1)
+           σ² ~ truncated(Cauchy(0, 3); lower=0)
+
+           # Likelihood
+           μ = α .+ β .* x
+           y ~ MvNormal(μ, σ² * I)
        end
 
-julia> model = my_first_model(randn())
+julia> x, y = rand(10), rand(10)
 
-julia> chain = sample(model, NUTS(), 1000)
+julia> posterior = linear_regression(x) | (; y = y)
+
+julia> chain = sample(posterior, NUTS(), 1000)
 ```
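A hypothetical follow-up to the snippet above, assuming MCMCChains' documented accessors (`summarystats` and symbol indexing), which `using Turing` normally makes available:

```julia
julia> summarystats(chain)  # mean, std, ESS, and R-hat for α, β, σ²

julia> mean(chain[:α])  # posterior mean of a single parameter
```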

 You can find the main TuringLang documentation at [**https://turinglang.org**](https://turinglang.org), which contains general information about Turing.jl's features, as well as a variety of tutorials with examples of Turing.jl models.
 
 API documentation for Turing.jl is specifically available at [**https://turinglang.org/Turing.jl/stable**](https://turinglang.org/Turing.jl/stable/).
 
-## 🛠️ Contributing
+## Contributing
 
 ### Issues

@@ -55,20 +66,20 @@ Breaking releases (minor version) should target the `breaking` branch.
 
 If you have not received any feedback on an issue or PR for a while, please feel free to ping `@TuringLang/maintainers` in a comment.
 
-## 💬 Other channels
+## Other channels
 
 The Turing.jl userbase tends to be most active on the [`#turing` channel of Julia Slack](https://julialang.slack.com/archives/CCYDC34A0).
 If you do not have an invitation to Julia's Slack, you can get one from [the official Julia website](https://julialang.org/slack/).
 
 There are also often threads on [Julia Discourse](https://discourse.julialang.org) (you can search using, e.g., [the `turing` tag](https://discourse.julialang.org/tag/turing)).
 
-## 🔄 What's changed recently?
+## What's changed recently?
 
 We publish a fortnightly newsletter summarising recent updates in the TuringLang ecosystem, which you can view on [our website](https://turinglang.org/news/), [GitHub](https://github.com/TuringLang/Turing.jl/issues/2498), or [Julia Slack](https://julialang.slack.com/archives/CCYDC34A0).
 
 For Turing.jl specifically, you can see a full changelog in [`HISTORY.md`](https://github.com/TuringLang/Turing.jl/blob/main/HISTORY.md) or [our GitHub releases](https://github.com/TuringLang/Turing.jl/releases).
 
-## 🧩 Where does Turing.jl sit in the TuringLang ecosystem?
+## Where does Turing.jl sit in the TuringLang ecosystem?
 
 Turing.jl is the main entry point for users, and seeks to provide a unified, convenient interface to all of the functionality in the TuringLang (and broader Julia) ecosystem.
 
@@ -125,5 +136,3 @@ month = feb,
 ```
 
 </details>
-
-You can see the full list of publications that have cited Turing.jl on [Google Scholar](https://scholar.google.com/scholar?cites=11803241473159708991).

docs/src/api.md

Lines changed: 1 addition & 0 deletions
@@ -63,6 +63,7 @@ even though [`Prior()`](@ref) is actually defined in the `Turing.Inference` modu
 | `Emcee` | [`Turing.Inference.Emcee`](@ref) | Affine-invariant ensemble sampler |
 | `ESS` | [`Turing.Inference.ESS`](@ref) | Elliptical slice sampling |
 | `Gibbs` | [`Turing.Inference.Gibbs`](@ref) | Gibbs sampling |
+| `GibbsConditional` | [`Turing.Inference.GibbsConditional`](@ref) | Gibbs sampling with analytical conditional posterior distributions |
 | `HMC` | [`Turing.Inference.HMC`](@ref) | Hamiltonian Monte Carlo |
 | `SGLD` | [`Turing.Inference.SGLD`](@ref) | Stochastic gradient Langevin dynamics |
 | `SGHMC` | [`Turing.Inference.SGHMC`](@ref) | Stochastic gradient Hamiltonian Monte Carlo |

src/Turing.jl

Lines changed: 1 addition & 0 deletions
@@ -102,6 +102,7 @@ export
     Emcee,
     ESS,
     Gibbs,
+    GibbsConditional,
     HMC,
     SGLD,
     SGHMC,

src/mcmc/Inference.jl

Lines changed: 2 additions & 0 deletions
@@ -56,6 +56,7 @@ export Hamiltonian,
     ESS,
     Emcee,
     Gibbs, # classic sampling
+    GibbsConditional, # conditional sampling
     HMC,
     SGLD,
     PolynomialStepsize,
@@ -433,6 +434,7 @@ include("sghmc.jl")
 include("emcee.jl")
 include("prior.jl")
 include("gibbs.jl")
+include("gibbs_conditional.jl")
 
 ################
 # Typing tools #

src/mcmc/abstractmcmc.jl

Lines changed: 1 addition & 0 deletions
@@ -131,6 +131,7 @@ function AbstractMCMC.sample(
         N,
         n_chains;
         chain_type,
+        check_model=false, # no need to check again
         initial_params=map(_convert_initial_params, initial_params),
         kwargs...,
     )
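This one-line change implements the 0.41.4 fix noted in HISTORY.md: the inner per-chain `sample` calls no longer re-run the model check, so a user-supplied `check_model=false` is now respected. A minimal sketch of the user-facing call this affects (the model here is a hypothetical placeholder):

```julia
using Turing

@model function demo()
    x ~ Normal()
end

# Previously, `check_model=false` was ignored when sampling multiple chains;
# with this change the model check is skipped as requested.
chain = sample(demo(), NUTS(), MCMCThreads(), 1000, 4; check_model=false)
```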

src/mcmc/gibbs_conditional.jl

Lines changed: 171 additions & 0 deletions
@@ -0,0 +1,171 @@
+"""
+    GibbsConditional(get_cond_dists)
+
+A Gibbs component sampler that samples variables according to user-provided analytical
+conditional posterior distributions.
+
+When using Gibbs sampling, sometimes one may know the analytical form of the posterior for
+a given variable, given the conditioned values of the other variables. In such cases one
+can use `GibbsConditional` as a component sampler to sample from these known conditionals
+directly, avoiding any MCMC methods. One does so with
+
+```julia
+sampler = Gibbs(
+    (@varname(var1), @varname(var2)) => GibbsConditional(get_cond_dists),
+    # other samplers go here...
+)
+```
+
+Here `get_cond_dists(c::Dict{<:VarName})` should be a function that takes a `Dict` mapping
+the conditioned variables (anything other than `var1` and `var2`) to their values, and
+returns the conditional posterior distributions for `var1` and `var2`. You may, of course,
+have any number of variables being sampled as a block in this manner; we only use two as an
+example. The return value of `get_cond_dists` should be one of the following:
+- A single `Distribution`, if only one variable is being sampled.
+- An `AbstractDict{<:VarName,<:Distribution}` that maps the variables being sampled to
+  their conditional posteriors, e.g. `Dict(@varname(var1) => dist1, @varname(var2) => dist2)`.
+- A `NamedTuple` of `Distribution`s, which is like the `AbstractDict` case but can be used
+  if all the variable names are single `Symbol`s, and may be more performant, e.g.
+  `(; var1=dist1, var2=dist2)`.
+
+# Examples
+
+```julia
+# Define a model
+@model function inverse_gdemo(x)
+    precision ~ Gamma(2, inv(3))
+    std = sqrt(1 / precision)
+    m ~ Normal(0, std)
+    for i in eachindex(x)
+        x[i] ~ Normal(m, std)
+    end
+end
+
+# Define analytical conditionals. See
+# https://en.wikipedia.org/wiki/Conjugate_prior#When_likelihood_function_is_a_continuous_distribution
+function cond_precision(c)
+    a = 2.0
+    b = 3.0
+    # We use AbstractPPL.getvalue instead of indexing into `c` directly to guard against
+    # issues where e.g. you try to get `c[@varname(x[1])]` but only `@varname(x)` is present
+    # in `c`. `getvalue` handles that gracefully, `getindex` doesn't. In this case
+    # `getindex` would suffice, but `getvalue` is good practice.
+    m = AbstractPPL.getvalue(c, @varname(m))
+    x = AbstractPPL.getvalue(c, @varname(x))
+    n = length(x)
+    a_new = a + (n + 1) / 2
+    b_new = b + sum(abs2, x .- m) / 2 + m^2 / 2
+    return Gamma(a_new, 1 / b_new)
+end
+
+function cond_m(c)
+    precision = AbstractPPL.getvalue(c, @varname(precision))
+    x = AbstractPPL.getvalue(c, @varname(x))
+    n = length(x)
+    m_mean = sum(x) / (n + 1)
+    m_var = 1 / (precision * (n + 1))
+    return Normal(m_mean, sqrt(m_var))
+end
+
+# Sample using GibbsConditional
+model = inverse_gdemo([1.0, 2.0, 3.0])
+chain = sample(model, Gibbs(
+    :precision => GibbsConditional(cond_precision),
+    :m => GibbsConditional(cond_m)
+), 1000)
+```
+"""
+struct GibbsConditional{C} <: AbstractSampler
+    get_cond_dists::C
+end
+
+isgibbscomponent(::GibbsConditional) = true
+
+"""
+    build_variable_dict(model::DynamicPPL.Model)
+
+Traverse the context stack of `model` and build a `Dict` of all the variable values that are
+set in GibbsContext, ConditionContext, or FixedContext.
+"""
+function build_variable_dict(model::DynamicPPL.Model)
+    context = model.context
+    cond_vals = DynamicPPL.conditioned(context)
+    fixed_vals = DynamicPPL.fixed(context)
+    # TODO(mhauru) Can we avoid invlinking all the time?
+    global_vi = DynamicPPL.invlink(get_gibbs_global_varinfo(context), model)
+    # TODO(mhauru) This creates a lot of Dicts, which are then immediately merged into one.
+    # Also, DynamicPPL.to_varname_dict is known to be inefficient. Make a more efficient
+    # implementation.
+    return merge(
+        DynamicPPL.values_as(global_vi, Dict),
+        DynamicPPL.to_varname_dict(cond_vals),
+        DynamicPPL.to_varname_dict(fixed_vals),
+        DynamicPPL.to_varname_dict(model.args),
+    )
+end
+
+function get_gibbs_global_varinfo(context::DynamicPPL.AbstractContext)
+    return if context isa GibbsContext
+        get_global_varinfo(context)
+    elseif DynamicPPL.NodeTrait(context) isa DynamicPPL.IsParent
+        get_gibbs_global_varinfo(DynamicPPL.childcontext(context))
+    else
+        msg = """No GibbsContext found in context stack. Are you trying to use \
+            GibbsConditional outside of Gibbs?
+            """
+        throw(ArgumentError(msg))
+    end
+end
+
+function initialstep(
+    ::Random.AbstractRNG,
+    model::DynamicPPL.Model,
+    ::GibbsConditional,
+    vi::DynamicPPL.AbstractVarInfo;
+    kwargs...,
+)
+    state = DynamicPPL.is_transformed(vi) ? DynamicPPL.invlink(vi, model) : vi
+    # Since GibbsConditional is only used within Gibbs, it does not need to return a
+    # transition.
+    return nothing, state
+end
+
+function AbstractMCMC.step(
+    rng::Random.AbstractRNG,
+    model::DynamicPPL.Model,
+    sampler::GibbsConditional,
+    state::DynamicPPL.AbstractVarInfo;
+    kwargs...,
+)
+    # Get all the conditioned variable values from the model context. This is assumed to
+    # include a GibbsContext as part of the context stack.
+    condvals = build_variable_dict(model)
+    conddists = sampler.get_cond_dists(condvals)
+
+    # We support three different kinds of return values for `sampler.get_cond_dists`, to
+    # make life easier for the user.
+    if conddists isa AbstractDict
+        for (vn, dist) in conddists
+            state = setindex!!(state, rand(rng, dist), vn)
+        end
+    elseif conddists isa NamedTuple
+        for (vn_sym, dist) in pairs(conddists)
+            vn = VarName{vn_sym}()
+            state = setindex!!(state, rand(rng, dist), vn)
+        end
+    else
+        # Single variable case.
+        vn = only(keys(state))
+        state = setindex!!(state, rand(rng, conddists), vn)
+    end
+
+    # Since GibbsConditional is only used within Gibbs, it does not need to return a
+    # transition.
+    return nothing, state
+end
+
+function setparams_varinfo!!(
+    ::DynamicPPL.Model, ::GibbsConditional, ::Any, params::DynamicPPL.AbstractVarInfo
+)
+    return params
+end
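For reference (a sketch of the derivation, not part of the source file), the conjugate updates used in `cond_precision` and `cond_m` above follow from standard Normal–Gamma conjugacy. Writing $\tau$ for `precision`, with prior $\tau \sim \mathrm{Gamma}(a, \text{rate } b)$, $m \mid \tau \sim \mathcal{N}(0, \tau^{-1})$ (variance $\tau^{-1}$), and $x_i \mid m, \tau \sim \mathcal{N}(m, \tau^{-1})$ for $i = 1, \dots, n$:

$$
\begin{aligned}
\tau \mid m, x &\sim \mathrm{Gamma}\!\left(a + \frac{n+1}{2},\ \text{rate } b + \frac{1}{2}\sum_{i=1}^{n}(x_i - m)^2 + \frac{m^2}{2}\right), \\
m \mid \tau, x &\sim \mathcal{N}\!\left(\frac{\sum_{i=1}^{n} x_i}{n+1},\ \frac{1}{(n+1)\tau}\right),
\end{aligned}
$$

which with $a = 2$ and $b = 3$ matches the code (Julia's `Gamma` takes a scale parameter, hence `1 / b_new`).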

src/mcmc/hmc.jl

Lines changed: 6 additions & 4 deletions
@@ -223,7 +223,7 @@ function Turing.Inference.initialstep(
     end
     # Generate a kernel and adaptor.
     kernel = make_ahmc_kernel(spl, ϵ)
-    adaptor = AHMCAdaptor(spl, hamiltonian.metric; ϵ=ϵ)
+    adaptor = AHMCAdaptor(spl, hamiltonian.metric, nadapts; ϵ=ϵ)
 
     transition = Transition(model, vi, NamedTuple())
     state = HMCState(vi, 1, kernel, hamiltonian, z, adaptor)
@@ -480,7 +480,9 @@ end
 #### Default HMC stepsize and mass matrix adaptor
 ####
 
-function AHMCAdaptor(alg::AdaptiveHamiltonian, metric::AHMC.AbstractMetric; ϵ=alg.ϵ)
+function AHMCAdaptor(
+    alg::AdaptiveHamiltonian, metric::AHMC.AbstractMetric, nadapts::Int; ϵ=alg.ϵ
+)
     pc = AHMC.MassMatrixAdaptor(metric)
     da = AHMC.StepSizeAdaptor(alg.δ, ϵ)
 
@@ -491,13 +493,13 @@ function AHMCAdaptor(alg::AdaptiveHamiltonian, metric::AHMC.AbstractMetric; ϵ=a
             adaptor = AHMC.NaiveHMCAdaptor(pc, da) # there is actually no adaptation for mass matrix
         else
             adaptor = AHMC.StanHMCAdaptor(pc, da)
-            AHMC.initialize!(adaptor, alg.n_adapts)
+            AHMC.initialize!(adaptor, nadapts)
         end
     end
 
     return adaptor
 end
 
-function AHMCAdaptor(::Hamiltonian, ::AHMC.AbstractMetric; kwargs...)
+function AHMCAdaptor(::Hamiltonian, ::AHMC.AbstractMetric, nadapts::Int; kwargs...)
     return AHMC.Adaptation.NoAdaptation()
 end
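Threading `nadapts` through to `AHMC.initialize!` is the 0.41.3 fix from HISTORY.md: previously the sampler's stored `alg.n_adapts` was used, which could disagree with the number of adaptation steps actually resolved at sampling time, so mass matrix adaptation did not actually happen. A brief sketch of a call that exercises this path, assuming the standard `NUTS(n_adapts, target_acceptance)` constructor (the model is a hypothetical placeholder):

```julia
using Turing

@model function demo()
    x ~ Normal()
end

# NUTS(n_adapts, δ): 500 adaptation steps, 0.65 target acceptance rate.
# With this fix, the 500 steps are forwarded to AHMC.initialize!, so the
# mass matrix is adapted during warm-up as intended.
chain = sample(demo(), NUTS(500, 0.65), 1500)
```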

test/Project.toml

Lines changed: 1 addition & 0 deletions
@@ -21,6 +21,7 @@ LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
 LogDensityProblems = "6fdf6af0-433a-55f7-b3ed-c6c6e0b8df7c"
 LogDensityProblemsAD = "996a588d-648d-4e1f-a8f0-a84b347e47b1"
 MCMCChains = "c7f686f2-ff18-58e9-bc7b-31028e88f75d"
+Mooncake = "da2b9cff-9c12-43a0-ae48-6db2b0edb7d6"
 NamedArrays = "86f7a689-2022-50b4-a561-43c23ac3c673"
 Optim = "429524aa-4258-5aef-a3af-852621145aeb"
 Optimization = "7f7a1694-90dd-40f0-9382-eb1efda571ba"
