# JasonPekos/hmm_turing.jl

## hmm_turing.jl
using Turing, HiddenMarkovModels
using PosteriorDB
using Makie, CairoMakie
using LinearAlgebra, LogExpFunctions
using DataFrames

# Fetch the "hmm_example" dataset and its validated reference draws from PosteriorDB
pdb = PosteriorDB.database()
data = let dataset = PosteriorDB.dataset(pdb, "hmm_example")
    PosteriorDB.load(dataset)
end
ref_post = let
    reference = PosteriorDB.reference_posterior(pdb, "hmm_example-hmm_example")
    DataFrame(PosteriorDB.load(reference))
end
# Every cell of a `ref_post` column is splatted into `vcat`, so each column of
# `ref_draws` is one flat vector (presumably pooling per-chain draws — confirm).
ref_draws = let cols = names(ref_post)
    DataFrame([vcat(ref_post[!, col]...) for col in cols], cols)
end

# Plotting Function(s)
# Plot the observations `data["y"]` as points against 1:data["N"], and draw each
# entry of `gq` on top as a faint grey line over the same x-range.
# Returns the Makie `Figure`.
function plot_states(gq, data)
    fig = Figure()
    panel = Axis(fig[1, 1])
    timesteps = 1:data["N"]

    scatter!(panel, timesteps, data["y"])
    foreach(gq) do trajectory
        # Low alpha so overlapping trajectories build up visual density.
        lines!(panel, timesteps, trajectory; color = :grey, alpha = 0.1)
    end

    return fig
end

# Scatter one pair of parameters for several sets of draws on a shared axis.
#
# Arguments
# - `chains`: collection of tables indexable as `ch[!, name]`.
# - `names_pair`: the two column names; the first goes on x, the second on y.
#
# Returns the Makie `Figure`. Each set is labelled "draws i" in input order, and
# a legend is attached so those labels are actually shown.
function plot_draws(chains, names_pair)
    xname, yname = names_pair[1], names_pair[2]
    f = Figure()
    ax = Axis(
        f[1, 1];
        title = "Turing vs PosteriorDB Reference Draws",
        xlabel = string(xname),
        ylabel = string(yname),
    )

    for (i, ch) in enumerate(chains)
        scatter!(ax, ch[!, xname], ch[!, yname]; alpha = 0.4, label = "draws $i")
    end

    # `axislegend` needs at least one labelled plot, so skip it for empty input.
    isempty(chains) || axislegend(ax)

    return f
end

# Define The Models:
# HMM with Gaussian emissions whose hidden states are summed out by the forward
# algorithm, so only `mu`, `theta1` and `theta2` are sampled.
#
# Arguments: `N` (not referenced in the body), `K` (number of states) and `y`
# (the observation sequence). The transition rows and emission distributions
# are written out for two states, so the body assumes K == 2.
#
# Returns, for every time step, the emission mean of the Viterbi-decoded state.
@model function example_hmm_marginalized(N, K, y)
    # Emission means, with unit-variance normal priors centred at 3 and 10.
    mu ~ MvNormal([3, 10], I)
    # One transition row per state. `softmax(ones(K))` is the constant vector
    # 1/K, so the Dirichlet concentration is 1/K per component.
    # NOTE(review): that is not the flat Dirichlet(1, ..., 1) — confirm it is the
    # prior intended for comparison with the reference draws.
    theta1 ~ Dirichlet(softmax(ones(K)))
    theta2 ~ Dirichlet(softmax(ones(K)))

    initial_probs = softmax(ones(K))        # equal weight on every state
    transition = [theta1'; theta2']         # rows are theta1 and theta2
    emissions = [Normal(mu[1], 1), Normal(mu[2], 1)]
    hmm = HMM(initial_probs, transition, emissions)

    # Second output of `forward` holds the log-likelihood; `only` unwraps its
    # single entry before it is added to the log density.
    loglik = only(forward(hmm, y)[2])
    Turing.@addlogprob! loglik

    # NOTE(review): this decoding runs on every model evaluation even though
    # only the return value uses it (original comment: "Probably do not want
    # this in the model?").
    decoded = first(viterbi(hmm, y))
    return mu[decoded]
end


# Sample
# Pass the model arguments by key. Splatting `values(data)...` hands them over
# in the container's iteration order, which for a `Dict` is arbitrary and need
# not match the (N, K, y) signature.
hmm_model = example_hmm_marginalized(data["N"], data["K"], data["y"])
chn_marg = sample(hmm_model, NUTS(), 1000, discard_initial = 1000)

# Compare Reference Draws:
# NOTE(review): assumes both data frames have columns named "theta1[1]" and
# "theta2[1]" — confirm against the reference posterior's column names.
df_chn_marg = DataFrame(chn_marg)
plot_draws([df_chn_marg, ref_draws], ["theta1[1]", "theta2[1]"])

# Re-evaluate the model's return value for the sampled draws and overlay the
# results on the observations.
gq = generated_quantities(hmm_model, chn_marg);
plot_states(gq, data)
	using Turing, HiddenMarkovModels
	using PosteriorDB
	using Makie, CairoMakie
	using LinearAlgebra, LogExpFunctions
	using DataFrames

	# NOTE(review): from here on the file repeats its first half line for line
	# (tab-indented), so running it reloads the data and samples a second time —
	# confirm whether this second copy is intended.
	#
	# Fetch the "hmm_example" dataset and its validated reference draws from PosteriorDB
	pdb = PosteriorDB.database()
	data = let dataset = PosteriorDB.dataset(pdb, "hmm_example")
	    PosteriorDB.load(dataset)
	end
	ref_post = let
	    reference = PosteriorDB.reference_posterior(pdb, "hmm_example-hmm_example")
	    DataFrame(PosteriorDB.load(reference))
	end
	# Every cell of a `ref_post` column is splatted into `vcat`, so each column of
	# `ref_draws` is one flat vector (presumably pooling per-chain draws — confirm).
	ref_draws = let cols = names(ref_post)
	    DataFrame([vcat(ref_post[!, col]...) for col in cols], cols)
	end

	# Plotting Function(s)
	# Plot the observations `data["y"]` as points against 1:data["N"], and draw each
	# entry of `gq` on top as a faint grey line over the same x-range.
	# Returns the Makie `Figure`.
	function plot_states(gq, data)
	    fig = Figure()
	    panel = Axis(fig[1, 1])
	    timesteps = 1:data["N"]

	    scatter!(panel, timesteps, data["y"])
	    foreach(gq) do trajectory
	        # Low alpha so overlapping trajectories build up visual density.
	        lines!(panel, timesteps, trajectory; color = :grey, alpha = 0.1)
	    end

	    return fig
	end

	# Scatter one pair of parameters for several sets of draws on a shared axis.
	#
	# Arguments
	# - `chains`: collection of tables indexable as `ch[!, name]`.
	# - `names_pair`: the two column names; the first goes on x, the second on y.
	#
	# Returns the Makie `Figure`. Each set is labelled "draws i" in input order, and
	# a legend is attached so those labels are actually shown.
	function plot_draws(chains, names_pair)
	    xname, yname = names_pair[1], names_pair[2]
	    f = Figure()
	    ax = Axis(
	        f[1, 1];
	        title = "Turing vs PosteriorDB Reference Draws",
	        xlabel = string(xname),
	        ylabel = string(yname),
	    )

	    for (i, ch) in enumerate(chains)
	        scatter!(ax, ch[!, xname], ch[!, yname]; alpha = 0.4, label = "draws $i")
	    end

	    # `axislegend` needs at least one labelled plot, so skip it for empty input.
	    isempty(chains) || axislegend(ax)

	    return f
	end

	# Define The Models:
	# HMM with Gaussian emissions whose hidden states are summed out by the forward
	# algorithm, so only `mu`, `theta1` and `theta2` are sampled.
	#
	# Arguments: `N` (not referenced in the body), `K` (number of states) and `y`
	# (the observation sequence). The transition rows and emission distributions
	# are written out for two states, so the body assumes K == 2.
	#
	# Returns, for every time step, the emission mean of the Viterbi-decoded state.
	@model function example_hmm_marginalized(N, K, y)
	    # Emission means, with unit-variance normal priors centred at 3 and 10.
	    mu ~ MvNormal([3, 10], I)
	    # One transition row per state. `softmax(ones(K))` is the constant vector
	    # 1/K, so the Dirichlet concentration is 1/K per component.
	    # NOTE(review): that is not the flat Dirichlet(1, ..., 1) — confirm it is the
	    # prior intended for comparison with the reference draws.
	    theta1 ~ Dirichlet(softmax(ones(K)))
	    theta2 ~ Dirichlet(softmax(ones(K)))

	    initial_probs = softmax(ones(K))        # equal weight on every state
	    transition = [theta1'; theta2']         # rows are theta1 and theta2
	    emissions = [Normal(mu[1], 1), Normal(mu[2], 1)]
	    hmm = HMM(initial_probs, transition, emissions)

	    # Second output of `forward` holds the log-likelihood; `only` unwraps its
	    # single entry before it is added to the log density.
	    loglik = only(forward(hmm, y)[2])
	    Turing.@addlogprob! loglik

	    # NOTE(review): this decoding runs on every model evaluation even though
	    # only the return value uses it (original comment: "Probably do not want
	    # this in the model?").
	    decoded = first(viterbi(hmm, y))
	    return mu[decoded]
	end


	# Sample
	# Pass the model arguments by key. Splatting `values(data)...` hands them over
	# in the container's iteration order, which for a `Dict` is arbitrary and need
	# not match the (N, K, y) signature.
	hmm_model = example_hmm_marginalized(data["N"], data["K"], data["y"])
	chn_marg = sample(hmm_model, NUTS(), 1000, discard_initial = 1000)

	# Compare Reference Draws:
	# NOTE(review): assumes both data frames have columns named "theta1[1]" and
	# "theta2[1]" — confirm against the reference posterior's column names.
	df_chn_marg = DataFrame(chn_marg)
	plot_draws([df_chn_marg, ref_draws], ["theta1[1]", "theta2[1]"])

	# Re-evaluate the model's return value for the sampled draws and overlay the
	# results on the observations.
	gq = generated_quantities(hmm_model, chn_marg);
	plot_states(gq, data)