Probabilistic Programming

Reactant.ProbProg is Reactant's probabilistic programming module, built on the impulse dialect.

A summary of exported symbols is provided in the Interface Overview. Please refer to the API Reference for documentation of exported symbols.

Example Usage

A model can be specified in one of two modes: trace-based mode (a Gen-style modeling language), where the generative function is expressed with `ProbProg.sample` calls and the inference kernel walks the trace; and custom logpdf mode, where the user supplies a log-density function directly. Each is illustrated below with a canonical example — Bayesian linear regression for the trace-based route, and Bayesian logistic regression for the custom logpdf route.

Trace-based mode: Bayesian linear regression

With the generative function written as ordinary Julia code and each random choice named via the `symbol` keyword, `generate` folds observations into the trace and `mcmc` updates the unobserved addresses via NUTS. Generation and inference are fused into a single compiled program:

julia

using Reactant, Statistics
using Reactant: ProbProg, ReactantRNG

# Generative model for Bayesian linear regression:
#   slope     ~ Normal(0,  2)
#   intercept ~ Normal(0, 10)
#   yᵢ | slope, intercept ~ Normal(slope · xᵢ + intercept, 1)
# Random choices are drawn in the order slope, intercept, ys, and each one is
# addressed by the `symbol` it is sampled under.
function linreg(rng, xs)
    slope_prior = ProbProg.Normal(0.0, 2.0, (1,))
    _, slope = ProbProg.sample(rng, slope_prior; symbol=:slope)

    intercept_prior = ProbProg.Normal(0.0, 10.0, (1,))
    _, intercept = ProbProg.sample(rng, intercept_prior; symbol=:intercept)

    # Likelihood: one Normal per covariate, centred on the regression line.
    mu = slope .* xs .+ intercept
    likelihood = ProbProg.Normal(mu, 1.0, (length(xs),))
    _, ys = ProbProg.sample(rng, likelihood; symbol=:ys)

    return ys
end

# Ten covariate values and the ten observed responses paired with them.
xs = [1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 9.0, 10.0]
ys = [8.23, 5.87, 3.99, 2.59, 0.23, -0.66, -3.53, -6.91, -7.24, -9.90]

# Fold observations into a flat constraint tensor.
# `obs` constrains the `:ys` address to the observed responses; the constrained
# addresses are then read back from it so the flattening loop below follows
# whatever order `extract_addresses` reports.
obs                   = ProbProg.Constraint(:ys => ys)
constrained_addresses = ProbProg.extract_addresses(obs)
obs_flat              = Float64[]
for addr in constrained_addresses
    # Flatten each constrained value and append it to the running buffer.
    append!(obs_flat, vec(obs[addr]))
end
# Reshape the buffer to a single row (1 × N) and convert it with `to_rarray`.
obs_tensor = Reactant.to_rarray(reshape(obs_flat, 1, :))

# Fused generate-then-infer program: `generate` builds a trace conditioned on the
# observations in `obs_tensor`, and `mcmc` then updates the addresses in
# `selection` with NUTS (200 warmup iterations, 500 retained samples).
# Returns the post-inference trace and the diagnostics reported by `mcmc`.
function program(rng, model, xs, obs_tensor, constrained_addresses,
                 selection, step_size, inverse_mass_matrix)
    initial_trace, _, _ = ProbProg.generate(
        rng, obs_tensor, model, xs;
        constrained_addresses=constrained_addresses,
    )

    posterior_trace, diagnostics, _, _ = ProbProg.mcmc(
        rng, initial_trace, model, xs;
        selection=selection,
        algorithm=:NUTS,
        step_size=step_size,
        inverse_mass_matrix=inverse_mass_matrix,
        num_warmup=200,
        num_samples=500,
    )

    return posterior_trace, diagnostics
end

# RNG seeded from a two-element UInt64 array.
seed = Reactant.to_rarray(UInt64[1, 5])
rng  = ReactantRNG(seed)
# Addresses handed to `mcmc` as `selection`: only :slope and :intercept.
selection           = ProbProg.select(
    ProbProg.Address(:slope),
    ProbProg.Address(:intercept),
)
# Step size and a 2×2 diagonal inverse mass matrix passed to NUTS.
# NOTE(review): presumably one diagonal entry per selected scalar — confirm.
step_size           = Reactant.ConcreteRNumber(0.1)
inverse_mass_matrix = Reactant.ConcreteRArray([0.5 0.0; 0.0 0.5])

# Compile `program` inside `with_trace`, which returns the compiled function
# together with `tt`; `tt.entries` is needed below to unflatten the result.
compiled_fn, tt = ProbProg.with_trace() do
    @compile optimize=:probprog program(
        rng, linreg, xs, obs_tensor, constrained_addresses,
        selection, step_size, inverse_mass_matrix,
    )
end

# Run the compiled program with the same arguments it was compiled for; the
# second return value of `program` is discarded here.
trace_tensor, _ = compiled_fn(
    rng, linreg, xs, obs_tensor, constrained_addresses,
    selection, step_size, inverse_mass_matrix,
)

# Keep only the trace entries covered by `selection`, then rebuild a trace with
# named choices from the flat tensor.
# NOTE(review): the meaning of the `0.0` and `nothing` arguments is not visible
# here — confirm against the ProbProg API reference.
selected_entries = ProbProg.filter_entries_by_selection(tt.entries, selection)
trace            = ProbProg.unflatten_trace(trace_tensor, 0.0, selected_entries, nothing)

# Posterior means: average the first column of each selected choice.
# NOTE(review): presumably rows index MCMC samples — confirm.
(
    posterior_mean_slope     = mean(trace.choices[:slope][:, 1]),
    posterior_mean_intercept = mean(trace.choices[:intercept][:, 1]),
)

(posterior_mean_slope = -1.9776590686052875, posterior_mean_intercept = 10.113221093249797)

The data were generated from slope = -2 and intercept = 10; the posterior means estimated by NUTS closely recover both values.

Custom logpdf mode: Bayesian logistic regression

When a closed-form log-density is available, mcmc_logpdf skips the trace machinery. Below, a standard Normal prior on the weight vector is combined with a logistic-regression likelihood written in the numerically stable form of the binary cross-entropy:

julia

# Unnormalised log-posterior for Bayesian logistic regression.
#   β ~ Normal(0, I);  yᵢ | β ~ Bernoulli(σ(xᵢ · β))
#   log p(β | X, y) = -½ ‖β‖²  +  Σᵢ [ yᵢ (xᵢ·β) − log(1 + exp(xᵢ·β)) ]
# `log(1 + exp(z))` is evaluated as `max(z, 0) + log1p(exp(-|z|))`, so `exp` only
# ever sees a non-positive argument and cannot overflow.
function logdensity(β, X, y)
    z = X * β

    # The two pieces of the stable softplus, subtracted one after the other.
    hinge = max.(z, 0.0)
    tail = log1p.(exp.(.-abs.(z)))
    loglik = sum(y .* z .- hinge .- tail)

    # Standard Normal prior on the weights, without its constant term.
    logprior = -0.5 * sum(β .* β)

    return loglik + logprior
end

# `mcmc_logpdf` is wrapped in a function that gets `@compile`d; this matches the
# pattern in `test/probprog/mcmc_logpdf.jl`.
# Runs NUTS on `logdensity_fn(position, X, y)` with step-size and mass-matrix
# adaptation switched on, and returns the samples together with the step size
# stored in the final sampler state.
function logreg_program(
    rng, logdensity_fn, initial_position, X, y,
    step_size, inverse_mass_matrix, num_warmup::Int, num_samples::Int,
)
    draws, _, _, final_state = ProbProg.mcmc_logpdf(
        rng, logdensity_fn, initial_position, X, y;
        algorithm=:NUTS,
        step_size=step_size,
        inverse_mass_matrix=inverse_mass_matrix,
        num_warmup=num_warmup,
        num_samples=num_samples,
        adapt_step_size=true,
        adapt_mass_matrix=true,
    )

    return draws, final_state.step_size
end

# Design matrix with an intercept column and one real-valued feature.
# Six rows, one per observation; the first column is the constant 1.0.
X_data = Float64[
    1.0 -0.5
    1.0  0.3
    1.0  0.8
    1.0 -0.2
    1.0  1.4
    1.0 -1.1
]
# Binary responses encoded as 0.0 / 1.0, one per row of `X_data`.
y_data = [0.0, 1.0, 1.0, 0.0, 1.0, 0.0]

# Convert the inputs to Reactant arrays. The starting position is a 1×2 row of
# zeros, and the inverse mass matrix starts as the 2×2 identity.
X                   = Reactant.to_rarray(X_data)
y                   = Reactant.to_rarray(y_data)
initial_position    = Reactant.to_rarray(reshape(zeros(2), 1, 2))
step_size_lr        = Reactant.ConcreteRNumber(0.1)
inverse_mass_matrix_lr = Reactant.ConcreteRArray([1.0 0.0; 0.0 1.0])

# Separate RNG for this example, seeded from a two-element UInt64 array.
seed_lr = Reactant.to_rarray(UInt64[2, 7])
rng_lr  = ReactantRNG(seed_lr)

# Compile once, then call the compiled function with the same arguments
# (200 warmup iterations, 500 samples).
compiled_lr = @compile optimize=:probprog logreg_program(
    rng_lr, logdensity, initial_position, X, y,
    step_size_lr, inverse_mass_matrix_lr, 200, 500,
)
samples, adapted_step_size = compiled_lr(
    rng_lr, logdensity, initial_position, X, y,
    step_size_lr, inverse_mass_matrix_lr, 200, 500,
)

# Bring the results back to host arrays: average the samples over dimension 1
# and unwrap the step size to a plain scalar.
(
    posterior_mean_β  = vec(mean(Array(samples); dims=1)),  # (intercept, slope)
    adapted_step_size = Array(adapted_step_size)[],
)

(posterior_mean_β = [-0.11050720305066576, 1.2605446188159923], adapted_step_size = 0.88991319293419)

Trace-based mode is preferable when the model is naturally expressed as a generative function and the same definition should drive forward simulation, conditioning, and inference; custom logpdf mode is preferable when a log-density implementation is already available or when integrating with an external log-density library.

Trusted by

Probabilistic Programming

Example Usage

Trace-based mode: Bayesian linear regression

Custom logpdf mode: Bayesian logistic regression

Further reading

Trusted by

Probabilistic Programming ​

Example Usage ​

Trace-based mode: Bayesian linear regression ​

Custom logpdf mode: Bayesian logistic regression ​

Further reading ​

Probabilistic Programming

Example Usage

Trace-based mode: Bayesian linear regression

Custom logpdf mode: Bayesian logistic regression

Further reading