From 677c9258f90321df480673445f1053dbf6d1b779 Mon Sep 17 00:00:00 2001
From: "Documenter.jl" <documenter@juliadocs.github.io>
Date: Fri, 12 Jul 2024 21:57:32 +0000
Subject: [PATCH] build based on 6ffa564

---
 dev/.documenter-siteinfo.json            |  2 +-
 dev/POMDPTools/beliefs/index.html        |  4 +-
 dev/POMDPTools/common_rl/index.html      |  4 +-
 dev/POMDPTools/distributions/index.html  |  4 +-
 dev/POMDPTools/index.html                |  2 +-
 dev/POMDPTools/model/index.html          | 10 +--
 dev/POMDPTools/policies/index.html       | 12 ++--
 dev/POMDPTools/simulators/index.html     | 18 ++---
 dev/POMDPTools/testing/index.html        |  4 +-
 dev/POMDPTools/visualization/index.html  |  4 +-
 dev/api/index.html                       | 40 +++++------
 dev/concepts/index.html                  |  2 +-
 dev/def_pomdp/index.html                 |  2 +-
 dev/def_solver/index.html                |  2 +-
 dev/def_updater/index.html               |  2 +-
 dev/example_defining_problems/index.html |  2 +-
 dev/example_gridworld_mdp/index.html     | 54 +++++++--------
 dev/example_simulations/index.html       | 84 ++++++++++++------------
 dev/example_solvers/index.html           | 18 ++---
 dev/examples/index.html                  |  2 +-
 dev/faq/index.html                       |  2 +-
 dev/gallery/index.html                   |  2 +-
 dev/get_started/index.html               |  2 +-
 dev/index.html                           |  2 +-
 dev/install/index.html                   |  2 +-
 dev/interfaces/index.html                |  2 +-
 dev/offline_solver/index.html            |  2 +-
 dev/online_solver/index.html             |  2 +-
 dev/policy_interaction/index.html        |  2 +-
 dev/run_simulation/index.html            |  2 +-
 dev/simulation/index.html                |  2 +-
 31 files changed, 147 insertions(+), 147 deletions(-)
diff --git a/dev/.documenter-siteinfo.json b/dev/.documenter-siteinfo.json
index 154f6a12..355f399d 100644
--- a/dev/.documenter-siteinfo.json
+++ b/dev/.documenter-siteinfo.json
@@ -1 +1 @@
-{"documenter":{"julia_version":"1.10.4","generation_timestamp":"2024-07-12T21:14:25","documenter_version":"1.5.0"}}
\ No newline at end of file
+{"documenter":{"julia_version":"1.10.4","generation_timestamp":"2024-07-12T21:57:27","documenter_version":"1.5.0"}}
\ No newline at end of file
diff --git a/dev/POMDPTools/beliefs/index.html b/dev/POMDPTools/beliefs/index.html
index 3b3e8f1a..6e9a48ea 100644
--- a/dev/POMDPTools/beliefs/index.html
+++ b/dev/POMDPTools/beliefs/index.html
@@ -1,7 +1,7 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Implemented Belief Updaters · POMDPs.jl</title><meta name="title" content="Implemented Belief Updaters · POMDPs.jl"/><meta property="og:title" content="Implemented Belief Updaters · POMDPs.jl"/><meta property="twitter:title" content="Implemented Belief Updaters · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" 
data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../../">POMDPs.jl</a></li><li><a class="tocitem" href="../../install/">Installation</a></li><li><a class="tocitem" href="../../get_started/">Getting Started</a></li><li><a class="tocitem" href="../../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../../def_solver/">Solvers</a></li><li><a class="tocitem" href="../../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../../online_solver/">Example: Defining an 
online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../../examples/">Examples</a></li><li><a class="tocitem" href="../../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../model/">Model Tools</a></li><li><a class="tocitem" href="../visualization/">Visualization</a></li><li class="is-active"><a class="tocitem" href>Implemented Belief Updaters</a><ul class="internal"><li><a class="tocitem" href="#Discrete-(Bayesian-Filter)"><span>Discrete (Bayesian Filter)</span></a></li><li><a class="tocitem" href="#K-Previous-Observations"><span>K Previous Observations</span></a></li><li><a class="tocitem" href="#Previous-Observation"><span>Previous Observation</span></a></li><li><a class="tocitem" href="#Nothing-Updater"><span>Nothing Updater</span></a></li></ul></li><li><a class="tocitem" href="../policies/">Implemented Policies</a></li><li><a class="tocitem" 
href="../simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">POMDPTools</a></li><li class="is-active"><a href>Implemented Belief Updaters</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Implemented Belief Updaters</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/POMDPTools/beliefs.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Implemented-Belief-Updaters"><a class="docs-heading-anchor" 
href="#Implemented-Belief-Updaters">Implemented Belief Updaters</a><a id="Implemented-Belief-Updaters-1"></a><a class="docs-heading-anchor-permalink" href="#Implemented-Belief-Updaters" title="Permalink"></a></h1><p>POMDPTools provides the following generic belief updaters:</p><ul><li>a discrete belief updater</li><li>a k previous observation updater</li><li>a previous observation updater </li><li>a nothing updater (for when the policy does not depend on any feedback)</li></ul><p>For particle filters see <a href="https://github.com/JuliaPOMDP/ParticleFilters.jl">ParticleFilters.jl</a>.</p><h2 id="Discrete-(Bayesian-Filter)"><a class="docs-heading-anchor" href="#Discrete-(Bayesian-Filter)">Discrete (Bayesian Filter)</a><a id="Discrete-(Bayesian-Filter)-1"></a><a class="docs-heading-anchor-permalink" href="#Discrete-(Bayesian-Filter)" title="Permalink"></a></h2><p>The <code>DiscreteUpater</code> is a default implementation of a discrete Bayesian filter. The <code>DiscreteBelief</code> type is provided to represent discrete beliefs for discrete state POMDPs. </p><p>A convenience function <code>uniform_belief</code> is provided to create a <code>DiscreteBelief</code> with equal probability for each state. </p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.DiscreteBelief" href="#POMDPTools.BeliefUpdaters.DiscreteBelief"><code>POMDPTools.BeliefUpdaters.DiscreteBelief</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">DiscreteBelief</code></pre><p>A belief specified by a probability vector.</p><p>Normalization of <code>b</code> is assumed in some calculations (e.g. 
pdf), but it is only automatically enforced in <code>update(...)</code>, and a warning is given if normalized incorrectly in <code>DiscreteBelief(pomdp, b)</code>.</p><p><strong>Constructor</strong></p><pre><code class="nohighlight hljs">DiscreteBelief(pomdp, b::Vector{Float64}; check::Bool=true)</code></pre><p><strong>Fields</strong></p><ul><li><code>pomdp</code> : the POMDP problem</li><li><code>state_list</code> : a vector of ordered states</li><li><code>b</code> : the probability vector</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/BeliefUpdaters/discrete.jl#L6-L20">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.DiscreteUpdater" href="#POMDPTools.BeliefUpdaters.DiscreteUpdater"><code>POMDPTools.BeliefUpdaters.DiscreteUpdater</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">DiscreteUpdater</code></pre><p>An updater type to update discrete belief using the discrete Bayesian filter.</p><p><strong>Constructor</strong></p><pre><code class="nohighlight hljs">DiscreteUpdater(pomdp::POMDP)</code></pre><p><strong>Fields</strong></p><ul><li><code>pomdp &lt;: POMDP</code></li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/BeliefUpdaters/discrete.jl#L98-L108">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.uniform_belief-Tuple{Any}" 
href="#POMDPTools.BeliefUpdaters.uniform_belief-Tuple{Any}"><code>POMDPTools.BeliefUpdaters.uniform_belief</code></a> — <span class="docstring-category">Method</span></header><section><div><pre><code class="language-julia hljs"> uniform_belief(pomdp)</code></pre><p>Return a DiscreteBelief with equal probability for each state.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/BeliefUpdaters/discrete.jl#L64-L68">source</a></section></article><h2 id="K-Previous-Observations"><a class="docs-heading-anchor" href="#K-Previous-Observations">K Previous Observations</a><a id="K-Previous-Observations-1"></a><a class="docs-heading-anchor-permalink" href="#K-Previous-Observations" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.KMarkovUpdater" href="#POMDPTools.BeliefUpdaters.KMarkovUpdater"><code>POMDPTools.BeliefUpdaters.KMarkovUpdater</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">KMarkovUpdater</code></pre><p>Updater that stores the k most recent observations as the belief.</p><p>Example:</p><pre><code class="language-julia hljs">up = KMarkovUpdater(5)
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Implemented Belief Updaters · POMDPs.jl</title><meta name="title" content="Implemented Belief Updaters · POMDPs.jl"/><meta property="og:title" content="Implemented Belief Updaters · POMDPs.jl"/><meta property="twitter:title" content="Implemented Belief Updaters · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" 
data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../../">POMDPs.jl</a></li><li><a class="tocitem" href="../../install/">Installation</a></li><li><a class="tocitem" href="../../get_started/">Getting Started</a></li><li><a class="tocitem" href="../../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../../def_solver/">Solvers</a></li><li><a class="tocitem" href="../../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../../online_solver/">Example: Defining an 
online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../../examples/">Examples</a></li><li><a class="tocitem" href="../../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../model/">Model Tools</a></li><li><a class="tocitem" href="../visualization/">Visualization</a></li><li class="is-active"><a class="tocitem" href>Implemented Belief Updaters</a><ul class="internal"><li><a class="tocitem" href="#Discrete-(Bayesian-Filter)"><span>Discrete (Bayesian Filter)</span></a></li><li><a class="tocitem" href="#K-Previous-Observations"><span>K Previous Observations</span></a></li><li><a class="tocitem" href="#Previous-Observation"><span>Previous Observation</span></a></li><li><a class="tocitem" href="#Nothing-Updater"><span>Nothing Updater</span></a></li></ul></li><li><a class="tocitem" href="../policies/">Implemented Policies</a></li><li><a class="tocitem" 
href="../simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">POMDPTools</a></li><li class="is-active"><a href>Implemented Belief Updaters</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Implemented Belief Updaters</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/POMDPTools/beliefs.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Implemented-Belief-Updaters"><a class="docs-heading-anchor" 
href="#Implemented-Belief-Updaters">Implemented Belief Updaters</a><a id="Implemented-Belief-Updaters-1"></a><a class="docs-heading-anchor-permalink" href="#Implemented-Belief-Updaters" title="Permalink"></a></h1><p>POMDPTools provides the following generic belief updaters:</p><ul><li>a discrete belief updater</li><li>a k previous observation updater</li><li>a previous observation updater </li><li>a nothing updater (for when the policy does not depend on any feedback)</li></ul><p>For particle filters see <a href="https://github.com/JuliaPOMDP/ParticleFilters.jl">ParticleFilters.jl</a>.</p><h2 id="Discrete-(Bayesian-Filter)"><a class="docs-heading-anchor" href="#Discrete-(Bayesian-Filter)">Discrete (Bayesian Filter)</a><a id="Discrete-(Bayesian-Filter)-1"></a><a class="docs-heading-anchor-permalink" href="#Discrete-(Bayesian-Filter)" title="Permalink"></a></h2><p>The <code>DiscreteUpater</code> is a default implementation of a discrete Bayesian filter. The <code>DiscreteBelief</code> type is provided to represent discrete beliefs for discrete state POMDPs. </p><p>A convenience function <code>uniform_belief</code> is provided to create a <code>DiscreteBelief</code> with equal probability for each state. </p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.DiscreteBelief" href="#POMDPTools.BeliefUpdaters.DiscreteBelief"><code>POMDPTools.BeliefUpdaters.DiscreteBelief</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">DiscreteBelief</code></pre><p>A belief specified by a probability vector.</p><p>Normalization of <code>b</code> is assumed in some calculations (e.g. 
pdf), but it is only automatically enforced in <code>update(...)</code>, and a warning is given if normalized incorrectly in <code>DiscreteBelief(pomdp, b)</code>.</p><p><strong>Constructor</strong></p><pre><code class="nohighlight hljs">DiscreteBelief(pomdp, b::Vector{Float64}; check::Bool=true)</code></pre><p><strong>Fields</strong></p><ul><li><code>pomdp</code> : the POMDP problem</li><li><code>state_list</code> : a vector of ordered states</li><li><code>b</code> : the probability vector</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/BeliefUpdaters/discrete.jl#L6-L20">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.DiscreteUpdater" href="#POMDPTools.BeliefUpdaters.DiscreteUpdater"><code>POMDPTools.BeliefUpdaters.DiscreteUpdater</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">DiscreteUpdater</code></pre><p>An updater type to update discrete belief using the discrete Bayesian filter.</p><p><strong>Constructor</strong></p><pre><code class="nohighlight hljs">DiscreteUpdater(pomdp::POMDP)</code></pre><p><strong>Fields</strong></p><ul><li><code>pomdp &lt;: POMDP</code></li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/BeliefUpdaters/discrete.jl#L98-L108">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.uniform_belief-Tuple{Any}" 
href="#POMDPTools.BeliefUpdaters.uniform_belief-Tuple{Any}"><code>POMDPTools.BeliefUpdaters.uniform_belief</code></a> — <span class="docstring-category">Method</span></header><section><div><pre><code class="language-julia hljs"> uniform_belief(pomdp)</code></pre><p>Return a DiscreteBelief with equal probability for each state.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/BeliefUpdaters/discrete.jl#L64-L68">source</a></section></article><h2 id="K-Previous-Observations"><a class="docs-heading-anchor" href="#K-Previous-Observations">K Previous Observations</a><a id="K-Previous-Observations-1"></a><a class="docs-heading-anchor-permalink" href="#K-Previous-Observations" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.KMarkovUpdater" href="#POMDPTools.BeliefUpdaters.KMarkovUpdater"><code>POMDPTools.BeliefUpdaters.KMarkovUpdater</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">KMarkovUpdater</code></pre><p>Updater that stores the k most recent observations as the belief.</p><p>Example:</p><pre><code class="language-julia hljs">up = KMarkovUpdater(5)
 s0 = rand(rng, initialstate(pomdp))
 initial_observation = rand(rng, initialobs(pomdp, s0))
 initial_obs_vec = fill(initial_observation, 5)
 hr = HistoryRecorder(rng=rng, max_steps=100)
-hist = simulate(hr, pomdp, policy, up, initial_obs_vec, s0)</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/BeliefUpdaters/k_previous_observations.jl#L1-L16">source</a></section></article><h2 id="Previous-Observation"><a class="docs-heading-anchor" href="#Previous-Observation">Previous Observation</a><a id="Previous-Observation-1"></a><a class="docs-heading-anchor-permalink" href="#Previous-Observation" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.PreviousObservationUpdater" href="#POMDPTools.BeliefUpdaters.PreviousObservationUpdater"><code>POMDPTools.BeliefUpdaters.PreviousObservationUpdater</code></a> — <span class="docstring-category">Type</span></header><section><div><p>Updater that stores the most recent observation as the belief. 
If an initial distribution is provided, it will pass that as the initial belief.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/BeliefUpdaters/previous_observation.jl#L6-L8">source</a></section></article><h2 id="Nothing-Updater"><a class="docs-heading-anchor" href="#Nothing-Updater">Nothing Updater</a><a id="Nothing-Updater-1"></a><a class="docs-heading-anchor-permalink" href="#Nothing-Updater" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.NothingUpdater" href="#POMDPTools.BeliefUpdaters.NothingUpdater"><code>POMDPTools.BeliefUpdaters.NothingUpdater</code></a> — <span class="docstring-category">Type</span></header><section><div><p>An updater useful for when a belief is not necessary (i.e. for a random policy). 
<code>update</code> always returns <code>nothing</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/BeliefUpdaters/void.jl#L4-L6">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../visualization/">« Visualization</a><a class="docs-footer-nextpage" href="../policies/">Implemented Policies »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+hist = simulate(hr, pomdp, policy, up, initial_obs_vec, s0)</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/BeliefUpdaters/k_previous_observations.jl#L1-L16">source</a></section></article><h2 id="Previous-Observation"><a class="docs-heading-anchor" href="#Previous-Observation">Previous Observation</a><a id="Previous-Observation-1"></a><a class="docs-heading-anchor-permalink" href="#Previous-Observation" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.PreviousObservationUpdater" href="#POMDPTools.BeliefUpdaters.PreviousObservationUpdater"><code>POMDPTools.BeliefUpdaters.PreviousObservationUpdater</code></a> — <span class="docstring-category">Type</span></header><section><div><p>Updater that stores the most recent observation as the belief. 
If an initial distribution is provided, it will pass that as the initial belief.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/BeliefUpdaters/previous_observation.jl#L6-L8">source</a></section></article><h2 id="Nothing-Updater"><a class="docs-heading-anchor" href="#Nothing-Updater">Nothing Updater</a><a id="Nothing-Updater-1"></a><a class="docs-heading-anchor-permalink" href="#Nothing-Updater" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.BeliefUpdaters.NothingUpdater" href="#POMDPTools.BeliefUpdaters.NothingUpdater"><code>POMDPTools.BeliefUpdaters.NothingUpdater</code></a> — <span class="docstring-category">Type</span></header><section><div><p>An updater useful when a belief is not necessary (e.g. for a random policy). 
<code>update</code> always returns <code>nothing</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/BeliefUpdaters/void.jl#L4-L6">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../visualization/">« Visualization</a><a class="docs-footer-nextpage" href="../policies/">Implemented Policies »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/POMDPTools/common_rl/index.html b/dev/POMDPTools/common_rl/index.html
index 40e06adf..2436a5c2 100644
--- a/dev/POMDPTools/common_rl/index.html
+++ b/dev/POMDPTools/common_rl/index.html
@@ -12,5 +12,5 @@
 m = convert(POMDP, env)
 planner = solve(POMCPSolver(), m)
 a = action(planner, initialstate(m))</code></pre><p>You can also use the constructors listed below to manually convert between the interfaces.</p><h2 id="Environment-Wrapper-Types"><a class="docs-heading-anchor" href="#Environment-Wrapper-Types">Environment Wrapper Types</a><a id="Environment-Wrapper-Types-1"></a><a class="docs-heading-anchor-permalink" href="#Environment-Wrapper-Types" title="Permalink"></a></h2><p>Since the standard reinforcement learning environment interface offers less information about the internal workings of the environment than the POMDPs.jl interface, MDPs and POMDPs created from these environments will have limited functionality. There are two types of (PO)MDP types that can wrap an environment:</p><h3 id="Generative-model-wrappers"><a class="docs-heading-anchor" href="#Generative-model-wrappers">Generative model wrappers</a><a id="Generative-model-wrappers-1"></a><a class="docs-heading-anchor-permalink" href="#Generative-model-wrappers" title="Permalink"></a></h3><p>If the <code>state</code> and <code>setstate!</code> CommonRLInterface functions are provided, then the environment can be wrapped in a <a href="#POMDPTools.CommonRLIntegration.RLEnvMDP"><code>RLEnvMDP</code></a> or <a href="#POMDPTools.CommonRLIntegration.RLEnvPOMDP"><code>RLEnvPOMDP</code></a> and the POMDPs.jl generative model interface will be available.</p><h3 id="Opaque-wrappers"><a class="docs-heading-anchor" href="#Opaque-wrappers">Opaque wrappers</a><a id="Opaque-wrappers-1"></a><a class="docs-heading-anchor-permalink" href="#Opaque-wrappers" title="Permalink"></a></h3><p>If the <code>state</code> and <code>setstate!</code> are not provided, then the resulting <code>POMDP</code> or <code>MDP</code> can only be simulated. This case is represented using the <a href="#POMDPTools.CommonRLIntegration.OpaqueRLEnvPOMDP"><code>OpaqueRLEnvPOMDP</code></a> and <a href="#POMDPTools.CommonRLIntegration.OpaqueRLEnvMDP"><code>OpaqueRLEnvMDP</code></a> wrappers. 
From the POMDPs.jl perspective, the state of the opaque (PO)MDP is just an integer wrapped in an <code>OpaqueRLEnvState</code>. This keeps track of the &quot;age&quot; of the environment so that POMDPs.jl actions that attempt to interact with the environment at a different age are invalid.</p><h2 id="Constructors"><a class="docs-heading-anchor" href="#Constructors">Constructors</a><a id="Constructors-1"></a><a class="docs-heading-anchor-permalink" href="#Constructors" title="Permalink"></a></h2><h3 id="Creating-RL-environments-from-MDPs-and-POMDPs"><a class="docs-heading-anchor" href="#Creating-RL-environments-from-MDPs-and-POMDPs">Creating RL environments from MDPs and POMDPs</a><a id="Creating-RL-environments-from-MDPs-and-POMDPs-1"></a><a class="docs-heading-anchor-permalink" href="#Creating-RL-environments-from-MDPs-and-POMDPs" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.CommonRLIntegration.MDPCommonRLEnv" href="#POMDPTools.CommonRLIntegration.MDPCommonRLEnv"><code>POMDPTools.CommonRLIntegration.MDPCommonRLEnv</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">MDPCommonRLEnv(m, [s])
-MDPCommonRLEnv{RLO}(m, [s])</code></pre><p>Create a CommonRLInterface environment from MDP m; optionally specify the state &#39;s&#39;.</p><p>The <code>RLO</code> parameter can be used to specify a type to convert the observation to. By default, this is <code>AbstractArray</code>. Use <code>Any</code> to disable conversion.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/CommonRLIntegration/to_env.jl#L13-L20">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.CommonRLIntegration.POMDPCommonRLEnv" href="#POMDPTools.CommonRLIntegration.POMDPCommonRLEnv"><code>POMDPTools.CommonRLIntegration.POMDPCommonRLEnv</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">POMDPCommonRLEnv(m, [s], [o])
-POMDPCommonRLEnv{RLO}(m, [s], [o])</code></pre><p>Create a CommonRLInterface environment from POMDP m; optionally specify the state &#39;s&#39; and observation &#39;o&#39;.</p><p>The <code>RLO</code> and <code>RLS</code> parameters can be used to specify types to convert the observation and state to. By default, this is <code>AbstractArray</code>. Use <code>Any</code> to disable conversion.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/CommonRLIntegration/to_env.jl#L56-L63">source</a></section></article><h3 id="Creating-MDPs-and-POMDPs-from-RL-environments"><a class="docs-heading-anchor" href="#Creating-MDPs-and-POMDPs-from-RL-environments">Creating MDPs and POMDPs from RL environments</a><a id="Creating-MDPs-and-POMDPs-from-RL-environments-1"></a><a class="docs-heading-anchor-permalink" href="#Creating-MDPs-and-POMDPs-from-RL-environments" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.CommonRLIntegration.RLEnvMDP" href="#POMDPTools.CommonRLIntegration.RLEnvMDP"><code>POMDPTools.CommonRLIntegration.RLEnvMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">RLEnvMDP(env; discount=1.0)</code></pre><p>Create an <code>MDP</code> by wrapping a <code>CommonRLInterface.AbstractEnv</code>. 
<code>state</code> and <code>setstate!</code> from <code>CommonRLInterface</code> must be provided, and the <code>POMDPs</code> generative model functionality will be provided.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/CommonRLIntegration/from_env.jl#L51-L55">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.CommonRLIntegration.RLEnvPOMDP" href="#POMDPTools.CommonRLIntegration.RLEnvPOMDP"><code>POMDPTools.CommonRLIntegration.RLEnvPOMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">RLEnvPOMDP(env; discount=1.0)</code></pre><p>Create an <code>POMDP</code> by wrapping a <code>CommonRLInterface.AbstractEnv</code>. <code>state</code> and <code>setstate!</code> from <code>CommonRLInterface</code> must be provided, and the <code>POMDPs</code> generative model functionality will be provided.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/CommonRLIntegration/from_env.jl#L73-L77">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.CommonRLIntegration.OpaqueRLEnvMDP" href="#POMDPTools.CommonRLIntegration.OpaqueRLEnvMDP"><code>POMDPTools.CommonRLIntegration.OpaqueRLEnvMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">OpaqueRLEnvMDP(env; discount=1.0)</code></pre><p>Wrap a <code>CommonRLInterface.AbstractEnv</code> in an <code>MDP</code> object. 
The state will be an <code>OpaqueRLEnvState</code> and only simulation will be supported.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/CommonRLIntegration/from_env.jl#L119-L123">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.CommonRLIntegration.OpaqueRLEnvPOMDP" href="#POMDPTools.CommonRLIntegration.OpaqueRLEnvPOMDP"><code>POMDPTools.CommonRLIntegration.OpaqueRLEnvPOMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">OpaqueRLEnvPOMDP(env; discount=1.0)</code></pre><p>Wrap a <code>CommonRLInterface.AbstractEnv</code> in an <code>POMDP</code> object. The state will be an <code>OpaqueRLEnvState</code> and only simulation will be supported.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/CommonRLIntegration/from_env.jl#L134-L138">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../simulators/">« Implemented Simulators</a><a class="docs-footer-nextpage" href="../testing/">Testing »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select 
id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+MDPCommonRLEnv{RLO}(m, [s])</code></pre><p>Create a CommonRLInterface environment from MDP m; optionally specify the state &#39;s&#39;.</p><p>The <code>RLO</code> parameter can be used to specify a type to convert the observation to. By default, this is <code>AbstractArray</code>. Use <code>Any</code> to disable conversion.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/CommonRLIntegration/to_env.jl#L13-L20">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.CommonRLIntegration.POMDPCommonRLEnv" href="#POMDPTools.CommonRLIntegration.POMDPCommonRLEnv"><code>POMDPTools.CommonRLIntegration.POMDPCommonRLEnv</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">POMDPCommonRLEnv(m, [s], [o])
+POMDPCommonRLEnv{RLO}(m, [s], [o])</code></pre><p>Create a CommonRLInterface environment from POMDP m; optionally specify the state &#39;s&#39; and observation &#39;o&#39;.</p><p>The <code>RLO</code> and <code>RLS</code> parameters can be used to specify types to convert the observation and state to. By default, this is <code>AbstractArray</code>. Use <code>Any</code> to disable conversion.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/CommonRLIntegration/to_env.jl#L56-L63">source</a></section></article><h3 id="Creating-MDPs-and-POMDPs-from-RL-environments"><a class="docs-heading-anchor" href="#Creating-MDPs-and-POMDPs-from-RL-environments">Creating MDPs and POMDPs from RL environments</a><a id="Creating-MDPs-and-POMDPs-from-RL-environments-1"></a><a class="docs-heading-anchor-permalink" href="#Creating-MDPs-and-POMDPs-from-RL-environments" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.CommonRLIntegration.RLEnvMDP" href="#POMDPTools.CommonRLIntegration.RLEnvMDP"><code>POMDPTools.CommonRLIntegration.RLEnvMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">RLEnvMDP(env; discount=1.0)</code></pre><p>Create an <code>MDP</code> by wrapping a <code>CommonRLInterface.AbstractEnv</code>. 
<code>state</code> and <code>setstate!</code> from <code>CommonRLInterface</code> must be provided, and the <code>POMDPs</code> generative model functionality will be provided.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/CommonRLIntegration/from_env.jl#L51-L55">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.CommonRLIntegration.RLEnvPOMDP" href="#POMDPTools.CommonRLIntegration.RLEnvPOMDP"><code>POMDPTools.CommonRLIntegration.RLEnvPOMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">RLEnvPOMDP(env; discount=1.0)</code></pre><p>Create a <code>POMDP</code> by wrapping a <code>CommonRLInterface.AbstractEnv</code>. <code>state</code> and <code>setstate!</code> from <code>CommonRLInterface</code> must be provided, and the <code>POMDPs</code> generative model functionality will be provided.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/CommonRLIntegration/from_env.jl#L73-L77">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.CommonRLIntegration.OpaqueRLEnvMDP" href="#POMDPTools.CommonRLIntegration.OpaqueRLEnvMDP"><code>POMDPTools.CommonRLIntegration.OpaqueRLEnvMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">OpaqueRLEnvMDP(env; discount=1.0)</code></pre><p>Wrap a <code>CommonRLInterface.AbstractEnv</code> in an <code>MDP</code> object. 
The state will be an <code>OpaqueRLEnvState</code> and only simulation will be supported.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/CommonRLIntegration/from_env.jl#L119-L123">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.CommonRLIntegration.OpaqueRLEnvPOMDP" href="#POMDPTools.CommonRLIntegration.OpaqueRLEnvPOMDP"><code>POMDPTools.CommonRLIntegration.OpaqueRLEnvPOMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">OpaqueRLEnvPOMDP(env; discount=1.0)</code></pre><p>Wrap a <code>CommonRLInterface.AbstractEnv</code> in a <code>POMDP</code> object. The state will be an <code>OpaqueRLEnvState</code> and only simulation will be supported.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/CommonRLIntegration/from_env.jl#L134-L138">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../simulators/">« Implemented Simulators</a><a class="docs-footer-nextpage" href="../testing/">Testing »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select 
id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/POMDPTools/distributions/index.html b/dev/POMDPTools/distributions/index.html
index e49c8b7f..06df77fa 100644
--- a/dev/POMDPTools/distributions/index.html
+++ b/dev/POMDPTools/distributions/index.html
@@ -1,5 +1,5 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Implemented Distributions · POMDPs.jl</title><meta name="title" content="Implemented Distributions · POMDPs.jl"/><meta property="og:title" content="Implemented Distributions · POMDPs.jl"/><meta property="twitter:title" content="Implemented Distributions · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" 
data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../../">POMDPs.jl</a></li><li><a class="tocitem" href="../../install/">Installation</a></li><li><a class="tocitem" href="../../get_started/">Getting Started</a></li><li><a class="tocitem" href="../../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../../def_solver/">Solvers</a></li><li><a class="tocitem" href="../../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../../online_solver/">Example: Defining an 
online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../../examples/">Examples</a></li><li><a class="tocitem" href="../../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../">POMDPTools: the standard library for POMDPs.jl</a></li><li class="is-active"><a class="tocitem" href>Implemented Distributions</a><ul class="internal"><li><a class="tocitem" href="#Sparse-Categorical-(SparseCat)"><span>Sparse Categorical (<code>SparseCat</code>)</span></a></li><li><a class="tocitem" href="#Implicit"><span>Implicit</span></a></li><li><a class="tocitem" href="#Bool-Distribution"><span>Bool Distribution</span></a></li><li><a class="tocitem" href="#Deterministic"><span>Deterministic</span></a></li><li><a class="tocitem" href="#Uniform"><span>Uniform</span></a></li><li><a class="tocitem" href="#Pretty-Printing"><span>Pretty Printing</span></a></li></ul></li><li><a class="tocitem" href="../model/">Model Tools</a></li><li><a class="tocitem" href="../visualization/">Visualization</a></li><li><a class="tocitem" href="../beliefs/">Implemented 
Belief Updaters</a></li><li><a class="tocitem" href="../policies/">Implemented Policies</a></li><li><a class="tocitem" href="../simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">POMDPTools</a></li><li class="is-active"><a href>Implemented Distributions</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Implemented Distributions</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/POMDPTools/distributions.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" 
id="documenter-page"><h1 id="Implemented-Distributions"><a class="docs-heading-anchor" href="#Implemented-Distributions">Implemented Distributions</a><a id="Implemented-Distributions-1"></a><a class="docs-heading-anchor-permalink" href="#Implemented-Distributions" title="Permalink"></a></h1><p>POMDPTools contains several utility distributions to be used in the POMDPs <code>transition</code> and <code>observation</code> functions. These implement the appropriate methods of the functions in the <a href="../../interfaces/#Distributions">distributions interface</a>.</p><p>This package also supplies <a href="#POMDPTools.POMDPDistributions.showdistribution"><code>showdistribution</code></a> for pretty printing distributions as unicode bar graphs to the terminal.</p><h2 id="Sparse-Categorical-(SparseCat)"><a class="docs-heading-anchor" href="#Sparse-Categorical-(SparseCat)">Sparse Categorical (<code>SparseCat</code>)</a><a id="Sparse-Categorical-(SparseCat)-1"></a><a class="docs-heading-anchor-permalink" href="#Sparse-Categorical-(SparseCat)" title="Permalink"></a></h2><p><code>SparseCat</code> is a sparse categorical distribution which is specified by simply providing a list of possible values (states or observations) and the probabilities corresponding to those particular objects.</p><p>Example: <code>SparseCat([1,2,3], [0.1,0.2,0.7])</code> is a categorical distribution that assigns probability 0.1 to <code>1</code>, 0.2 to <code>2</code>, 0.7 to <code>3</code>, and 0 to all other values.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.SparseCat" href="#POMDPTools.POMDPDistributions.SparseCat"><code>POMDPTools.POMDPDistributions.SparseCat</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">SparseCat(values, 
probabilities)</code></pre><p>Create a sparse categorical distribution.</p><p><code>values</code> is an iterable object containing the possible values (can be of any type) in the distribution that have nonzero probability. <code>probabilities</code> is an iterable object that contains the associated probabilities.</p><p>This is optimized for value iteration with a fast implementation of <code>weighted_iterator</code>. Both <code>pdf</code> and <code>rand</code> are order n.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/POMDPDistributions/sparse_cat.jl#L1-L9">source</a></section></article><h2 id="Implicit"><a class="docs-heading-anchor" href="#Implicit">Implicit</a><a id="Implicit-1"></a><a class="docs-heading-anchor-permalink" href="#Implicit" title="Permalink"></a></h2><p>In situations where a distribution object is required, but the pdf is difficult to specify and only samples are required, <code>ImplicitDistribution</code> provides a convenient way to package a sampling function.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.ImplicitDistribution" href="#POMDPTools.POMDPDistributions.ImplicitDistribution"><code>POMDPTools.POMDPDistributions.ImplicitDistribution</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">ImplicitDistribution(sample_function, args...)</code></pre><p>Define a distribution that can only be sampled from using <code>rand</code>, but has no explicit <code>pdf</code>.</p><p>Each time <code>rand(rng, d::ImplicitDistribution)</code> is called,</p><pre><code class="language-julia hljs">sample_function(args..., rng)</code></pre><p>will be called to generate a new 
sample.</p><p><code>ImplicitDistribution</code> is designed to be used with anonymous functions or the <code>do</code> syntax as follows:</p><p><strong>Examples</strong></p><pre><code class="language-julia hljs">ImplicitDistribution(rng-&gt;rand(rng)^2)</code></pre><pre><code class="language-julia hljs">struct MyMDP &lt;: MDP{Float64, Int} end
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Implemented Distributions · POMDPs.jl</title><meta name="title" content="Implemented Distributions · POMDPs.jl"/><meta property="og:title" content="Implemented Distributions · POMDPs.jl"/><meta property="twitter:title" content="Implemented Distributions · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" 
data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../../">POMDPs.jl</a></li><li><a class="tocitem" href="../../install/">Installation</a></li><li><a class="tocitem" href="../../get_started/">Getting Started</a></li><li><a class="tocitem" href="../../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../../def_solver/">Solvers</a></li><li><a class="tocitem" href="../../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../../online_solver/">Example: Defining an 
online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../../examples/">Examples</a></li><li><a class="tocitem" href="../../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../">POMDPTools: the standard library for POMDPs.jl</a></li><li class="is-active"><a class="tocitem" href>Implemented Distributions</a><ul class="internal"><li><a class="tocitem" href="#Sparse-Categorical-(SparseCat)"><span>Sparse Categorical (<code>SparseCat</code>)</span></a></li><li><a class="tocitem" href="#Implicit"><span>Implicit</span></a></li><li><a class="tocitem" href="#Bool-Distribution"><span>Bool Distribution</span></a></li><li><a class="tocitem" href="#Deterministic"><span>Deterministic</span></a></li><li><a class="tocitem" href="#Uniform"><span>Uniform</span></a></li><li><a class="tocitem" href="#Pretty-Printing"><span>Pretty Printing</span></a></li></ul></li><li><a class="tocitem" href="../model/">Model Tools</a></li><li><a class="tocitem" href="../visualization/">Visualization</a></li><li><a class="tocitem" href="../beliefs/">Implemented 
Belief Updaters</a></li><li><a class="tocitem" href="../policies/">Implemented Policies</a></li><li><a class="tocitem" href="../simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">POMDPTools</a></li><li class="is-active"><a href>Implemented Distributions</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Implemented Distributions</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/POMDPTools/distributions.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" 
id="documenter-page"><h1 id="Implemented-Distributions"><a class="docs-heading-anchor" href="#Implemented-Distributions">Implemented Distributions</a><a id="Implemented-Distributions-1"></a><a class="docs-heading-anchor-permalink" href="#Implemented-Distributions" title="Permalink"></a></h1><p>POMDPTools contains several utility distributions to be used in the POMDPs <code>transition</code> and <code>observation</code> functions. These implement the appropriate methods of the functions in the <a href="../../interfaces/#Distributions">distributions interface</a>.</p><p>This package also supplies <a href="#POMDPTools.POMDPDistributions.showdistribution"><code>showdistribution</code></a> for pretty printing distributions as unicode bar graphs to the terminal.</p><h2 id="Sparse-Categorical-(SparseCat)"><a class="docs-heading-anchor" href="#Sparse-Categorical-(SparseCat)">Sparse Categorical (<code>SparseCat</code>)</a><a id="Sparse-Categorical-(SparseCat)-1"></a><a class="docs-heading-anchor-permalink" href="#Sparse-Categorical-(SparseCat)" title="Permalink"></a></h2><p><code>SparseCat</code> is a sparse categorical distribution which is specified by simply providing a list of possible values (states or observations) and the probabilities corresponding to those particular objects.</p><p>Example: <code>SparseCat([1,2,3], [0.1,0.2,0.7])</code> is a categorical distribution that assigns probability 0.1 to <code>1</code>, 0.2 to <code>2</code>, 0.7 to <code>3</code>, and 0 to all other values.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.SparseCat" href="#POMDPTools.POMDPDistributions.SparseCat"><code>POMDPTools.POMDPDistributions.SparseCat</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">SparseCat(values, 
probabilities)</code></pre><p>Create a sparse categorical distribution.</p><p><code>values</code> is an iterable object containing the possible values (can be of any type) in the distribution that have nonzero probability. <code>probabilities</code> is an iterable object that contains the associated probabilities.</p><p>This is optimized for value iteration with a fast implementation of <code>weighted_iterator</code>. Both <code>pdf</code> and <code>rand</code> are order n.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/POMDPDistributions/sparse_cat.jl#L1-L9">source</a></section></article><h2 id="Implicit"><a class="docs-heading-anchor" href="#Implicit">Implicit</a><a id="Implicit-1"></a><a class="docs-heading-anchor-permalink" href="#Implicit" title="Permalink"></a></h2><p>In situations where a distribution object is required, but the pdf is difficult to specify and only samples are required, <code>ImplicitDistribution</code> provides a convenient way to package a sampling function.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.ImplicitDistribution" href="#POMDPTools.POMDPDistributions.ImplicitDistribution"><code>POMDPTools.POMDPDistributions.ImplicitDistribution</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">ImplicitDistribution(sample_function, args...)</code></pre><p>Define a distribution that can only be sampled from using <code>rand</code>, but has no explicit <code>pdf</code>.</p><p>Each time <code>rand(rng, d::ImplicitDistribution)</code> is called,</p><pre><code class="language-julia hljs">sample_function(args..., rng)</code></pre><p>will be called to generate a new 
sample.</p><p><code>ImplicitDistribution</code> is designed to be used with anonymous functions or the <code>do</code> syntax as follows:</p><p><strong>Examples</strong></p><pre><code class="language-julia hljs">ImplicitDistribution(rng-&gt;rand(rng)^2)</code></pre><pre><code class="language-julia hljs">struct MyMDP &lt;: MDP{Float64, Int} end
 
 function POMDPs.transition(m::MyMDP, s, a)
     ImplicitDistribution(s, a) do s, a, rng
@@ -8,4 +8,4 @@
 end
 
 td = transition(MyMDP(), 1.0, 1)
-rand(td) # will return a number near 2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/POMDPDistributions/implicit.jl#L1-L32">source</a></section></article><h2 id="Bool-Distribution"><a class="docs-heading-anchor" href="#Bool-Distribution">Bool Distribution</a><a id="Bool-Distribution-1"></a><a class="docs-heading-anchor-permalink" href="#Bool-Distribution" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.BoolDistribution" href="#POMDPTools.POMDPDistributions.BoolDistribution"><code>POMDPTools.POMDPDistributions.BoolDistribution</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">BoolDistribution(p_true)</code></pre><p>Create a distribution over Boolean values (<code>true</code> or <code>false</code>).</p><p><code>p_true</code> is the probability of the <code>true</code> outcome; the probability of <code>false</code> is 1-<code>p_true</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/POMDPDistributions/bool.jl#L1-L7">source</a></section></article><h2 id="Deterministic"><a class="docs-heading-anchor" href="#Deterministic">Deterministic</a><a id="Deterministic-1"></a><a class="docs-heading-anchor-permalink" href="#Deterministic" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.Deterministic" 
href="#POMDPTools.POMDPDistributions.Deterministic"><code>POMDPTools.POMDPDistributions.Deterministic</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">Deterministic(value)</code></pre><p>Create a deterministic distribution over only one value.</p><p>This is intended to be used when a distribution is required, but the outcome is deterministic. It is equivalent to a Kronecker Delta distribution.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/POMDPDistributions/deterministic.jl#L1-L7">source</a></section></article><h2 id="Uniform"><a class="docs-heading-anchor" href="#Uniform">Uniform</a><a id="Uniform-1"></a><a class="docs-heading-anchor-permalink" href="#Uniform" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.Uniform" href="#POMDPTools.POMDPDistributions.Uniform"><code>POMDPTools.POMDPDistributions.Uniform</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">Uniform(collection)</code></pre><p>Create a uniform categorical distribution over a collection of objects.</p><p>The objects in the collection must be unique (this is tested on construction), and will be stored in a <code>Set</code>. 
To avoid this overhead, use <code>UnsafeUniform</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/POMDPDistributions/uniform.jl#L5-L11">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.UnsafeUniform" href="#POMDPTools.POMDPDistributions.UnsafeUniform"><code>POMDPTools.POMDPDistributions.UnsafeUniform</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">UnsafeUniform(collection)</code></pre><p>Create a uniform categorical distribution over a collection of objects.</p><p>No checks are performed to ensure uniqueness or check whether an object is actually in the set when evaluating the pdf.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/POMDPDistributions/uniform.jl#L39-L45">source</a></section></article><h2 id="Pretty-Printing"><a class="docs-heading-anchor" href="#Pretty-Printing">Pretty Printing</a><a id="Pretty-Printing-1"></a><a class="docs-heading-anchor-permalink" href="#Pretty-Printing" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.showdistribution" href="#POMDPTools.POMDPDistributions.showdistribution"><code>POMDPTools.POMDPDistributions.showdistribution</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">showdistribution([io], [mime], d)</code></pre><p>Show a UnicodePlots.barplot representation of a 
distribution.</p><p><strong>Keyword Arguments</strong></p><ul><li><code>title::String=string(typeof(d))*&quot; distribution&quot;</code>: title for the barplot. </li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/POMDPDistributions/pretty_printing.jl#L1-L9">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../">« POMDPTools: the standard library for POMDPs.jl</a><a class="docs-footer-nextpage" href="../model/">Model Tools »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+rand(td) # will return a number near 2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/POMDPDistributions/implicit.jl#L1-L32">source</a></section></article><h2 id="Bool-Distribution"><a class="docs-heading-anchor" href="#Bool-Distribution">Bool Distribution</a><a id="Bool-Distribution-1"></a><a class="docs-heading-anchor-permalink" href="#Bool-Distribution" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.BoolDistribution" href="#POMDPTools.POMDPDistributions.BoolDistribution"><code>POMDPTools.POMDPDistributions.BoolDistribution</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">BoolDistribution(p_true)</code></pre><p>Create a distribution over Boolean values (<code>true</code> or <code>false</code>).</p><p><code>p_true</code> is the probability of the <code>true</code> outcome; the probability of <code>false</code> is 1-<code>p_true</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/POMDPDistributions/bool.jl#L1-L7">source</a></section></article><h2 id="Deterministic"><a class="docs-heading-anchor" href="#Deterministic">Deterministic</a><a id="Deterministic-1"></a><a class="docs-heading-anchor-permalink" href="#Deterministic" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.Deterministic" 
href="#POMDPTools.POMDPDistributions.Deterministic"><code>POMDPTools.POMDPDistributions.Deterministic</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">Deterministic(value)</code></pre><p>Create a deterministic distribution over only one value.</p><p>This is intended to be used when a distribution is required, but the outcome is deterministic. It is equivalent to a Kronecker Delta distribution.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/POMDPDistributions/deterministic.jl#L1-L7">source</a></section></article><h2 id="Uniform"><a class="docs-heading-anchor" href="#Uniform">Uniform</a><a id="Uniform-1"></a><a class="docs-heading-anchor-permalink" href="#Uniform" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.Uniform" href="#POMDPTools.POMDPDistributions.Uniform"><code>POMDPTools.POMDPDistributions.Uniform</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">Uniform(collection)</code></pre><p>Create a uniform categorical distribution over a collection of objects.</p><p>The objects in the collection must be unique (this is tested on construction), and will be stored in a <code>Set</code>. 
To avoid this overhead, use <code>UnsafeUniform</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/POMDPDistributions/uniform.jl#L5-L11">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.UnsafeUniform" href="#POMDPTools.POMDPDistributions.UnsafeUniform"><code>POMDPTools.POMDPDistributions.UnsafeUniform</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">UnsafeUniform(collection)</code></pre><p>Create a uniform categorical distribution over a collection of objects.</p><p>No checks are performed to ensure uniqueness or check whether an object is actually in the set when evaluating the pdf.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/POMDPDistributions/uniform.jl#L39-L45">source</a></section></article><h2 id="Pretty-Printing"><a class="docs-heading-anchor" href="#Pretty-Printing">Pretty Printing</a><a id="Pretty-Printing-1"></a><a class="docs-heading-anchor-permalink" href="#Pretty-Printing" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.POMDPDistributions.showdistribution" href="#POMDPTools.POMDPDistributions.showdistribution"><code>POMDPTools.POMDPDistributions.showdistribution</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">showdistribution([io], [mime], d)</code></pre><p>Show a UnicodePlots.barplot representation of a 
distribution.</p><p><strong>Keyword Arguments</strong></p><ul><li><code>title::String=string(typeof(d))*&quot; distribution&quot;</code>: title for the barplot. </li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/POMDPDistributions/pretty_printing.jl#L1-L9">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../">« POMDPTools: the standard library for POMDPs.jl</a><a class="docs-footer-nextpage" href="../model/">Model Tools »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/POMDPTools/index.html b/dev/POMDPTools/index.html
index 2b076ad3..129d4937 100644
--- a/dev/POMDPTools/index.html
+++ b/dev/POMDPTools/index.html
@@ -1,2 +1,2 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>POMDPTools: the standard library for POMDPs.jl · POMDPs.jl</title><meta name="title" content="POMDPTools: the standard library for POMDPs.jl · POMDPs.jl"/><meta property="og:title" content="POMDPTools: the standard library for POMDPs.jl · POMDPs.jl"/><meta property="twitter:title" content="POMDPTools: the standard library for POMDPs.jl · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online 
solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li class="is-active"><a class="tocitem" href>POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="model/">Model Tools</a></li><li><a class="tocitem" href="visualization/">Visualization</a></li><li><a class="tocitem" href="beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="policies/">Implemented Policies</a></li><li><a class="tocitem" href="simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static 
is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">POMDPTools</a></li><li class="is-active"><a href>POMDPTools: the standard library for POMDPs.jl</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>POMDPTools: the standard library for POMDPs.jl</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/POMDPTools/index.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="pomdptools_section"><a class="docs-heading-anchor" href="#pomdptools_section">POMDPTools: the standard library for POMDPs.jl</a><a id="pomdptools_section-1"></a><a class="docs-heading-anchor-permalink" href="#pomdptools_section" title="Permalink"></a></h1><p>The POMDPs.jl package does nothing more than define an <em>interface</em> or <em>language</em> for interacting with and solving (PO)MDPs; it does not contain any implementations. 
In practice, defining and solving POMDPs is made vastly easier if some commonly-used structures are provided. The POMDPTools package contains these implementations. Thus, the relationship between POMDPs.jl and POMDPTools is similar to the relationship between a programming language and its <a href="https://en.wikipedia.org/wiki/Standard_library">standard library</a>.</p><p>The POMDPTools package source code is hosted in <a href="https://github.com/JuliaPOMDP/POMDPs.jl/tree/master/lib/POMDPTools">the POMDPs.jl github repository in the <code>lib/POMDPTools</code> directory</a>.</p><p>The contents of the library are outlined below:</p><ul><li><a href="distributions/#Implemented-Distributions">Implemented Distributions</a></li><li class="no-marker"><ul><li><a href="distributions/#Sparse-Categorical-(SparseCat)">Sparse Categorical (<code>SparseCat</code>)</a></li><li><a href="distributions/#Implicit">Implicit</a></li><li><a href="distributions/#Bool-Distribution">Bool Distribution</a></li><li><a href="distributions/#Deterministic">Deterministic</a></li><li><a href="distributions/#Uniform">Uniform</a></li><li><a href="distributions/#Pretty-Printing">Pretty Printing</a></li></ul></li><li><a href="model/#Model-Tools">Model Tools</a></li><li class="no-marker"><ul><li><a href="model/#Interface-Extensions">Interface Extensions</a></li><li><a href="model/#Model-Transformations">Model Transformations</a></li><li><a href="model/#Utility-Types">Utility Types</a></li></ul></li><li><a href="visualization/#Visualization">Visualization</a></li><li><a href="beliefs/#Implemented-Belief-Updaters">Implemented Belief Updaters</a></li><li class="no-marker"><ul><li><a href="beliefs/#Discrete-(Bayesian-Filter)">Discrete (Bayesian Filter)</a></li><li><a href="beliefs/#K-Previous-Observations">K Previous Observations</a></li><li><a href="beliefs/#Previous-Observation">Previous Observation</a></li><li><a href="beliefs/#Nothing-Updater">Nothing Updater</a></li></ul></li><li><a 
href="policies/#Implemented-Policies">Implemented Policies</a></li><li class="no-marker"><ul><li><a href="policies/#Function">Function</a></li><li><a href="policies/#Alpha-Vector-Policy">Alpha Vector Policy</a></li><li><a href="policies/#Random-Policy">Random Policy</a></li><li><a href="policies/#Stochastic-Policies">Stochastic Policies</a></li><li><a href="policies/#Vector-Policies">Vector Policies</a></li><li><a href="policies/#Value-Dict-Policy">Value Dict Policy</a></li><li><a href="policies/#Exploration-Policies">Exploration Policies</a></li><li><a href="policies/#Playback-Policy">Playback Policy</a></li><li><a href="policies/#Utility-Wrapper">Utility Wrapper</a></li><li><a href="policies/#Pretty-Printing-Policies">Pretty Printing Policies</a></li></ul></li><li><a href="policies/#Policy-Evaluation">Policy Evaluation</a></li><li><a href="simulators/#Implemented-Simulators">Implemented Simulators</a></li><li class="no-marker"><ul><li><a href="simulators/#which_simulator">Which Simulator Should I Use?</a></li><li><a href="simulators/#Stepping-through">Stepping through</a></li><li><a href="simulators/#Rollouts">Rollouts</a></li><li><a href="simulators/#History-Recorder">History Recorder</a></li><li><a href="simulators/#sim-function"><code>sim()</code></a></li><li><a href="simulators/#Histories">Histories</a></li><li><a href="simulators/#Parallel">Parallel</a></li><li><a href="simulators/#Display">Display</a></li></ul></li><li><a href="common_rl/#CommonRLInterface-Integration">CommonRLInterface Integration</a></li><li class="no-marker"><ul><li><a href="common_rl/#Environment-Wrapper-Types">Environment Wrapper Types</a></li><li><a href="common_rl/#Constructors">Constructors</a></li></ul></li><li><a href="testing/#Testing">Testing</a></li><li class="no-marker"><ul><li><a href="testing/#Testing-(PO)MDP-Models">Testing (PO)MDP Models</a></li><li><a href="testing/#Testing-Solvers">Testing Solvers</a></li></ul></li></ul></article><nav class="docs-footer"><a 
class="docs-footer-prevpage" href="../gallery/">« Gallery of POMDPs.jl Problems</a><a class="docs-footer-nextpage" href="distributions/">Implemented Distributions »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>POMDPTools: the standard library for POMDPs.jl · POMDPs.jl</title><meta name="title" content="POMDPTools: the standard library for POMDPs.jl · POMDPs.jl"/><meta property="og:title" content="POMDPTools: the standard library for POMDPs.jl · POMDPs.jl"/><meta property="twitter:title" content="POMDPTools: the standard library for POMDPs.jl · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online 
solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li class="is-active"><a class="tocitem" href>POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="model/">Model Tools</a></li><li><a class="tocitem" href="visualization/">Visualization</a></li><li><a class="tocitem" href="beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="policies/">Implemented Policies</a></li><li><a class="tocitem" href="simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static 
is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">POMDPTools</a></li><li class="is-active"><a href>POMDPTools: the standard library for POMDPs.jl</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>POMDPTools: the standard library for POMDPs.jl</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/POMDPTools/index.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="pomdptools_section"><a class="docs-heading-anchor" href="#pomdptools_section">POMDPTools: the standard library for POMDPs.jl</a><a id="pomdptools_section-1"></a><a class="docs-heading-anchor-permalink" href="#pomdptools_section" title="Permalink"></a></h1><p>The POMDPs.jl package does nothing more than define an <em>interface</em> or <em>language</em> for interacting with and solving (PO)MDPs; it does not contain any implementations. 
In practice, defining and solving POMDPs is made vastly easier if some commonly-used structures are provided. The POMDPTools package contains these implementations. Thus, the relationship between POMDPs.jl and POMDPTools is similar to the relationship between a programming language and its <a href="https://en.wikipedia.org/wiki/Standard_library">standard library</a>.</p><p>The POMDPTools package source code is hosted in <a href="https://github.com/JuliaPOMDP/POMDPs.jl/tree/master/lib/POMDPTools">the POMDPs.jl github repository in the <code>lib/POMDPTools</code> directory</a>.</p><p>The contents of the library are outlined below:</p><ul><li><a href="distributions/#Implemented-Distributions">Implemented Distributions</a></li><li class="no-marker"><ul><li><a href="distributions/#Sparse-Categorical-(SparseCat)">Sparse Categorical (<code>SparseCat</code>)</a></li><li><a href="distributions/#Implicit">Implicit</a></li><li><a href="distributions/#Bool-Distribution">Bool Distribution</a></li><li><a href="distributions/#Deterministic">Deterministic</a></li><li><a href="distributions/#Uniform">Uniform</a></li><li><a href="distributions/#Pretty-Printing">Pretty Printing</a></li></ul></li><li><a href="model/#Model-Tools">Model Tools</a></li><li class="no-marker"><ul><li><a href="model/#Interface-Extensions">Interface Extensions</a></li><li><a href="model/#Model-Transformations">Model Transformations</a></li><li><a href="model/#Utility-Types">Utility Types</a></li></ul></li><li><a href="visualization/#Visualization">Visualization</a></li><li><a href="beliefs/#Implemented-Belief-Updaters">Implemented Belief Updaters</a></li><li class="no-marker"><ul><li><a href="beliefs/#Discrete-(Bayesian-Filter)">Discrete (Bayesian Filter)</a></li><li><a href="beliefs/#K-Previous-Observations">K Previous Observations</a></li><li><a href="beliefs/#Previous-Observation">Previous Observation</a></li><li><a href="beliefs/#Nothing-Updater">Nothing Updater</a></li></ul></li><li><a 
href="policies/#Implemented-Policies">Implemented Policies</a></li><li class="no-marker"><ul><li><a href="policies/#Function">Function</a></li><li><a href="policies/#Alpha-Vector-Policy">Alpha Vector Policy</a></li><li><a href="policies/#Random-Policy">Random Policy</a></li><li><a href="policies/#Stochastic-Policies">Stochastic Policies</a></li><li><a href="policies/#Vector-Policies">Vector Policies</a></li><li><a href="policies/#Value-Dict-Policy">Value Dict Policy</a></li><li><a href="policies/#Exploration-Policies">Exploration Policies</a></li><li><a href="policies/#Playback-Policy">Playback Policy</a></li><li><a href="policies/#Utility-Wrapper">Utility Wrapper</a></li><li><a href="policies/#Pretty-Printing-Policies">Pretty Printing Policies</a></li></ul></li><li><a href="policies/#Policy-Evaluation">Policy Evaluation</a></li><li><a href="simulators/#Implemented-Simulators">Implemented Simulators</a></li><li class="no-marker"><ul><li><a href="simulators/#which_simulator">Which Simulator Should I Use?</a></li><li><a href="simulators/#Stepping-through">Stepping through</a></li><li><a href="simulators/#Rollouts">Rollouts</a></li><li><a href="simulators/#History-Recorder">History Recorder</a></li><li><a href="simulators/#sim-function"><code>sim()</code></a></li><li><a href="simulators/#Histories">Histories</a></li><li><a href="simulators/#Parallel">Parallel</a></li><li><a href="simulators/#Display">Display</a></li></ul></li><li><a href="common_rl/#CommonRLInterface-Integration">CommonRLInterface Integration</a></li><li class="no-marker"><ul><li><a href="common_rl/#Environment-Wrapper-Types">Environment Wrapper Types</a></li><li><a href="common_rl/#Constructors">Constructors</a></li></ul></li><li><a href="testing/#Testing">Testing</a></li><li class="no-marker"><ul><li><a href="testing/#Testing-(PO)MDP-Models">Testing (PO)MDP Models</a></li><li><a href="testing/#Testing-Solvers">Testing Solvers</a></li></ul></li></ul></article><nav class="docs-footer"><a 
class="docs-footer-prevpage" href="../gallery/">« Gallery of POMDPs.jl Problems</a><a class="docs-footer-nextpage" href="distributions/">Implemented Distributions »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/POMDPTools/model/index.html b/dev/POMDPTools/model/index.html
index 80eb83ba..3507bc18 100644
--- a/dev/POMDPTools/model/index.html
+++ b/dev/POMDPTools/model/index.html
@@ -5,9 +5,9 @@
 julia&gt; collect(weighted_iterator(d))
 2-element Array{Pair{Bool,Float64},1}:
   true =&gt; 0.7
- false =&gt; 0.3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/POMDPDistributions/weighted_iteration.jl#L1-L18">source</a></section></article><h3 id="Observation-Weight"><a class="docs-heading-anchor" href="#Observation-Weight">Observation Weight</a><a id="Observation-Weight-1"></a><a class="docs-heading-anchor-permalink" href="#Observation-Weight" title="Permalink"></a></h3><p>Sometimes, e.g. in particle filtering, the relative likelihood of an observation is required in addition to a generative model, and it is often tedious to implement a custom observation distribution type. For this case, the shortcut function <code>obs_weight</code> is provided.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.obs_weight" href="#POMDPTools.ModelTools.obs_weight"><code>POMDPTools.ModelTools.obs_weight</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">obs_weight(pomdp, s, a, sp, o)</code></pre><p>Return a weight proportional to the likelihood of receiving observation o from state sp (and a and s if they are present).</p><p>This is a useful shortcut for particle filtering so that the observation distribution does not have to be represented.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/obs_weight.jl#L4-L10">source</a></section></article><h3 id="Ordered-Spaces"><a class="docs-heading-anchor" href="#Ordered-Spaces">Ordered Spaces</a><a id="Ordered-Spaces-1"></a><a class="docs-heading-anchor-permalink" href="#Ordered-Spaces" title="Permalink"></a></h3><p>It is often useful to have a list of states, 
actions, or observations ordered consistently with the respective <code>index</code> function from POMDPs.jl. Since the POMDPs.jl interface does not demand that spaces be ordered consistently with <code>index</code>, the <code>states</code>, <code>actions</code>, and <code>observations</code> functions are not sufficient. Thus POMDPModelTools provides <code>ordered_actions</code>, <code>ordered_states</code>, and <code>ordered_observations</code> to provide this capability.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.ordered_actions" href="#POMDPTools.ModelTools.ordered_actions"><code>POMDPTools.ModelTools.ordered_actions</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">ordered_actions(mdp)</code></pre><p>Return an <code>AbstractVector</code> of actions ordered according to <code>actionindex(mdp, a)</code>.</p><p><code>ordered_actions(mdp)</code> will always return an <code>AbstractVector{A}</code> <code>v</code> containing all of the actions in <code>actions(mdp)</code> in the order such that <code>actionindex(mdp, v[i]) == i</code>. 
You may wish to override this for your problem for efficiency.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/ordered_spaces.jl#L3-L9">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.ordered_states" href="#POMDPTools.ModelTools.ordered_states"><code>POMDPTools.ModelTools.ordered_states</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">ordered_states(mdp)</code></pre><p>Return an <code>AbstractVector</code> of states ordered according to <code>stateindex(mdp, a)</code>.</p><p><code>ordered_states(mdp)</code> will always return a <code>AbstractVector{A}</code> <code>v</code> containing all of the states in <code>states(mdp)</code> in the order such that <code>stateindex(mdp, v[i]) == i</code>. 
You may wish to override this for your problem for efficiency.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/ordered_spaces.jl#L12-L18">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.ordered_observations" href="#POMDPTools.ModelTools.ordered_observations"><code>POMDPTools.ModelTools.ordered_observations</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">ordered_observations(pomdp)</code></pre><p>Return an <code>AbstractVector</code> of observations ordered according to <code>obsindex(pomdp, a)</code>.</p><p><code>ordered_observations(mdp)</code> will always return a <code>AbstractVector{A}</code> <code>v</code> containing all of the observations in <code>observations(pomdp)</code> in the order such that <code>obsindex(pomdp, v[i]) == i</code>. You may wish to override this for your problem for efficiency.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/ordered_spaces.jl#L21-L27">source</a></section></article><h3 id="Info-Interface"><a class="docs-heading-anchor" href="#Info-Interface">Info Interface</a><a id="Info-Interface-1"></a><a class="docs-heading-anchor-permalink" href="#Info-Interface" title="Permalink"></a></h3><p>It is often the case that useful information besides the belief, state, action, etc is generated by a function in POMDPs.jl. This information can be useful for debugging or understanding the behavior of a solver, updater, or problem. 
The info interface provides a standard way for problems, policies, solvers or updaters to output this information. The recording simulators from <a href="../#pomdptools_section">POMDPTools</a> automatically record this information.</p><p>To specify info from policies, solvers, or updaters, implement the following functions:</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.action_info" href="#POMDPTools.ModelTools.action_info"><code>POMDPTools.ModelTools.action_info</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">a, ai = action_info(policy, x)</code></pre><p>Return a tuple containing the action determined by policy &#39;p&#39; at state or belief &#39;x&#39; and information (usually a <code>NamedTuple</code>, <code>Dict</code> or <code>nothing</code>) from the calculation of that action.</p><p>By default, returns <code>nothing</code> as info.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/info.jl#L4-L10">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.solve_info" href="#POMDPTools.ModelTools.solve_info"><code>POMDPTools.ModelTools.solve_info</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">policy, si = solve_info(solver, problem)</code></pre><p>Return a tuple containing the policy determined by a solver and information (usually a <code>NamedTuple</code>, <code>Dict</code> or <code>nothing</code>) from the calculation of that policy.</p><p>By 
default, returns <code>nothing</code> as info.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/info.jl#L15-L21">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.update_info" href="#POMDPTools.ModelTools.update_info"><code>POMDPTools.ModelTools.update_info</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">bp, i = update_info(updater, b, a, o)</code></pre><p>Return a tuple containing the new belief and information (usually a <code>NamedTuple</code>, <code>Dict</code> or <code>nothing</code>) from the belief update.</p><p>By default, returns <code>nothing</code> as info.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/info.jl#L26-L32">source</a></section></article><h2 id="Model-Transformations"><a class="docs-heading-anchor" href="#Model-Transformations">Model Transformations</a><a id="Model-Transformations-1"></a><a class="docs-heading-anchor-permalink" href="#Model-Transformations" title="Permalink"></a></h2><p>POMDPTools contains several tools for transforming problems into other classes so that they can be used by different solvers.</p><h3 id="Linear-Algebra-Representations"><a class="docs-heading-anchor" href="#Linear-Algebra-Representations">Linear Algebra Representations</a><a id="Linear-Algebra-Representations-1"></a><a class="docs-heading-anchor-permalink" href="#Linear-Algebra-Representations" title="Permalink"></a></h3><p>For some algorithms, such as value iteration, it is convenient to use vectors that contain the reward for every state, and matrices 
that contain the transition probabilities. These can be constructed with the following functions:</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.transition_matrices" href="#POMDPTools.ModelTools.transition_matrices"><code>POMDPTools.ModelTools.transition_matrices</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">transition_matrices(p::SparseTabularProblem)</code></pre><p>Accessor function for the transition model of a sparse tabular problem. It returns a list of sparse matrices for each action of the problem.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L304-L309">source</a></section><section><div><pre><code class="language-julia hljs">transition_matrices(m::Union{MDP,POMDP})
-transition_matrices(m; sparse=true)</code></pre><p>Construct transition matrices for (PO)MDP m.</p><p>The returned object is an associative object (usually a Dict), where the keys are actions. Each value in this object is an AbstractMatrix where the row corresponds to the state index of s and the column corresponds to the state index of s&#39;. The entry in the matrix is the probability of transitioning from state s to state s&#39;.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/matrices.jl#L1-L8">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.reward_vectors" href="#POMDPTools.ModelTools.reward_vectors"><code>POMDPTools.ModelTools.reward_vectors</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">reward_vectors(m::Union{MDP, POMDP})</code></pre><p>Construct reward vectors for (PO)MDP m.</p><p>The returned object is an associative object (usually a Dict), where the keys are actions. 
Each value in this object is an AbstractVector where the index corresponds to the state index of s and the entry is the reward for that state.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/matrices.jl#L19-L25">source</a></section></article><h3 id="Sparse-Tabular-MDPs-and-POMDPs"><a class="docs-heading-anchor" href="#Sparse-Tabular-MDPs-and-POMDPs">Sparse Tabular MDPs and POMDPs</a><a id="Sparse-Tabular-MDPs-and-POMDPs-1"></a><a class="docs-heading-anchor-permalink" href="#Sparse-Tabular-MDPs-and-POMDPs" title="Permalink"></a></h3><p>The <code>SparseTabularMDP</code> and <code>SparseTabularPOMDP</code> represents discrete problems defined using the explicit interface. The transition and observation models are represented using sparse matrices. Solver writers can leverage these data structures to write efficient vectorized code. A problem writer can define its problem using the explicit interface and it can be automatically converted to a sparse tabular representation by calling the constructors <code>SparseTabularMDP(::MDP)</code> or <code>SparseTabularPOMDP(::POMDP)</code>. See the following docs to know more about the matrix representation and how to access the fields of the <code>SparseTabular</code> objects:</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.SparseTabularMDP" href="#POMDPTools.ModelTools.SparseTabularMDP"><code>POMDPTools.ModelTools.SparseTabularMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">SparseTabularMDP</code></pre><p>An MDP object where states and actions are integers and the transition is represented by a list of sparse matrices. 
This data structure can be useful to exploit in vectorized algorithm (e.g. see SparseValueIterationSolver). The recommended way to access the transition and reward matrices is through the provided accessor functions: <code>transition_matrix</code> and <code>reward_vector</code>.</p><p><strong>Fields</strong></p><ul><li><code>T::Vector{SparseMatrixCSC{Float64, Int64}}</code> The transition model is represented as a vector of sparse matrices (one for each action). <code>T[a][s, sp]</code> the probability of transition from <code>s</code> to <code>sp</code> taking action <code>a</code>.</li><li><code>R::Array{Float64, 2}</code> The reward is represented as a matrix where the rows are states and the columns actions: <code>R[s, a]</code> is the reward of taking action <code>a</code> in sate <code>s</code>.</li><li><code>initial_probs::SparseVector{Float64, Int64}</code> Specifies the initial state distribution</li><li><code>terminal_states::Set{Int64}</code> Stores the terminal states</li><li><code>discount::Float64</code> The discount factor</li></ul><p><strong>Constructors</strong></p><ul><li><code>SparseTabularMDP(mdp::MDP)</code> : One can provide the matrices to the default constructor or one can construct a <code>SparseTabularMDP</code> from any discrete state MDP defined using the explicit interface. </li></ul><p>Note that constructing the transition and reward matrices requires to iterate over all the states and can take a while. 
To learn more information about how to define an MDP with the explicit interface please visit https://juliapomdp.github.io/POMDPs.jl/latest/explicit/ .</p><ul><li><code>SparseTabularMDP(smdp::SparseTabularMDP; transition, reward, discount)</code> : This constructor returns a new sparse MDP that is a copy of the original smdp except for the field specified by the keyword arguments.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L1-L21">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.SparseTabularPOMDP" href="#POMDPTools.ModelTools.SparseTabularPOMDP"><code>POMDPTools.ModelTools.SparseTabularPOMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">SparseTabularPOMDP</code></pre><p>A POMDP object where states and actions are integers and the transition and observation distributions are represented by lists of sparse matrices. This data structure can be useful to exploit in vectorized algorithms to gain performance (e.g. see SparseValueIterationSolver). The recommended way to access the transition, reward, and observation matrices is through the provided accessor functions: <code>transition_matrix</code>, <code>reward_vector</code>, <code>observation_matrix</code>.</p><p><strong>Fields</strong></p><ul><li><code>T::Vector{SparseMatrixCSC{Float64, Int64}}</code> The transition model is represented as a vector of sparse matrices (one for each action). 
<code>T[a][s, sp]</code> the probability of transition from <code>s</code> to <code>sp</code> taking action <code>a</code>.</li><li><code>R::Array{Float64, 2}</code> The reward is represented as a matrix where the rows are states and the columns actions: <code>R[s, a]</code> is the reward of taking action <code>a</code> in sate <code>s</code>.</li><li><code>O::Vector{SparseMatrixCSC{Float64, Int64}}</code> The observation model is represented as a vector of sparse matrices (one for each action). <code>O[a][sp, o]</code> is the probability of observing <code>o</code> from state <code>sp</code> after having taken action <code>a</code>.</li><li><code>initial_probs::SparseVector{Float64, Int64}</code> Specifies the initial state distribution</li><li><code>terminal_states::Set{Int64}</code> Stores the terminal states</li><li><code>discount::Float64</code> The discount factor</li></ul><p><strong>Constructors</strong></p><ul><li><code>SparseTabularPOMDP(pomdp::POMDP)</code> : One can provide the matrices to the default constructor or one can construct a <code>SparseTabularPOMDP</code> from any discrete state MDP defined using the explicit interface. </li></ul><p>Note that constructing the transition and reward matrices requires to iterate over all the states and can take a while. 
To learn more information about how to define an MDP with the explicit interface please visit https://juliapomdp.github.io/POMDPs.jl/latest/explicit/ .</p><ul><li><code>SparseTabularPOMDP(spomdp::SparseTabularMDP; transition, reward, observation, discount)</code> : This constructor returns a new sparse POMDP that is a copy of the original smdp except for the field specified by the keyword arguments.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L76-L99">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.transition_matrix" href="#POMDPTools.ModelTools.transition_matrix"><code>POMDPTools.ModelTools.transition_matrix</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">transition_matrix(p::SparseTabularProblem, a)</code></pre><p>Accessor function for the transition model of a sparse tabular problem. 
It returns a sparse matrix containing the transition probabilities when taking action a: T[s, sp] = Pr(sp | s, a).</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L297-L301">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.reward_vector" href="#POMDPTools.ModelTools.reward_vector"><code>POMDPTools.ModelTools.reward_vector</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">reward_vector(p::SparseTabularProblem, a)</code></pre><p>Accessor function for the reward function of a sparse tabular problem. It returns a vector containing the reward for all the states when taking action a: R(s, a).  The length of the return vector is equal to the number of states.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L311-L316">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.observation_matrix" href="#POMDPTools.ModelTools.observation_matrix"><code>POMDPTools.ModelTools.observation_matrix</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">observation_matrix(p::SparseTabularPOMDP, a::Int64)</code></pre><p>Accessor function for the observation model of a sparse tabular POMDP. 
It returns a sparse matrix containing the observation probabilities when having taken action a: O[sp, o] = Pr(o | sp, a).</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L333-L337">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.reward_matrix" href="#POMDPTools.ModelTools.reward_matrix"><code>POMDPTools.ModelTools.reward_matrix</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">reward_matrix(p::SparseTabularProblem)</code></pre><p>Accessor function for the reward matrix R[s, a] of a sparse tabular problem.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L319-L323">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.observation_matrices" href="#POMDPTools.ModelTools.observation_matrices"><code>POMDPTools.ModelTools.observation_matrices</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">observation_matrices(p::SparseTabularPOMDP)</code></pre><p>Accessor function for the observation model of a sparse tabular POMDP. 
It returns a list of sparse matrices for each action of the problem.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L340-L345">source</a></section></article><h3 id="Fully-Observable-POMDP"><a class="docs-heading-anchor" href="#Fully-Observable-POMDP">Fully Observable POMDP</a><a id="Fully-Observable-POMDP-1"></a><a class="docs-heading-anchor-permalink" href="#Fully-Observable-POMDP" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.FullyObservablePOMDP" href="#POMDPTools.ModelTools.FullyObservablePOMDP"><code>POMDPTools.ModelTools.FullyObservablePOMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">FullyObservablePOMDP(mdp)</code></pre><p>Turn <code>MDP</code> <code>mdp</code> into a <code>POMDP</code> where the observations are the states of the MDP.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/fully_observable_pomdp.jl#L1-L5">source</a></section></article><h3 id="Generative-Belief-MDP"><a class="docs-heading-anchor" href="#Generative-Belief-MDP">Generative Belief MDP</a><a id="Generative-Belief-MDP-1"></a><a class="docs-heading-anchor-permalink" href="#Generative-Belief-MDP" title="Permalink"></a></h3><p>Every POMDP is an MDP on the belief space <code>GenerativeBeliefMDP</code> creates a generative model for that MDP.</p><div class="admonition is-warning"><header class="admonition-header">Warning</header><div class="admonition-body"><p>The reward generated by the <code>GenerativeBeliefMDP</code> is the reward for a <em>single state sampled 
from the belief</em>; it is not the   expected reward for that belief transition (though, in expectation, they are equivalent of course). Implementing the model with the expected reward requires a custom implementation because belief updaters do not typically deal with reward.</p></div></div><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.GenerativeBeliefMDP" href="#POMDPTools.ModelTools.GenerativeBeliefMDP"><code>POMDPTools.ModelTools.GenerativeBeliefMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">GenerativeBeliefMDP(pomdp, updater)
-GenerativeBeliefMDP(pomdp, updater; terminal_behavior=TerminalStateTerminalBehavior())</code></pre><p>Create a generative model of the belief MDP corresponding to POMDP <code>pomdp</code> with belief updates performed by <code>updater</code>. Each step is performed by sampling a state from the current belief, generating an observation from that state and action, and then using <code>updater</code> to update the belief.</p><p>A belief is considered terminal when <em>all</em> POMDP states in the support with nonzero probability are terminal.</p><p>The default behavior when a terminal POMDP state is sampled from the belief is to transition to <a href="#POMDPTools.ModelTools.terminalstate"><code>terminalstate</code></a>. This can be controlled by the <code>terminal_behavior</code> keyword argument. Using <code>terminal_behavior=ContinueTerminalBehavior(pomdp, updater)</code> will cause the MDP to keep attempting a belief update even when the sampled state is terminal. This can be further customized by providing <code>terminal_behavior</code> with a <code>Function</code> or callable object that takes arguments <code>b, s, a, rng</code> and returns a new belief (see the implementation of <code>ContinueTerminalBehavior</code> for an example). You can customize behavior additionally using <code>determine_gbmdp_state_type</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/generative_belief_mdp.jl#L1-L10">source</a></section></article><h4 id="Example"><a class="docs-heading-anchor" href="#Example">Example</a><a id="Example-1"></a><a class="docs-heading-anchor-permalink" href="#Example" title="Permalink"></a></h4><pre><code class="language-julia hljs">using POMDPs
+ false =&gt; 0.3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/POMDPDistributions/weighted_iteration.jl#L1-L18">source</a></section></article><h3 id="Observation-Weight"><a class="docs-heading-anchor" href="#Observation-Weight">Observation Weight</a><a id="Observation-Weight-1"></a><a class="docs-heading-anchor-permalink" href="#Observation-Weight" title="Permalink"></a></h3><p>Sometimes, e.g. in particle filtering, the relative likelihood of an observation is required in addition to a generative model, and it is often tedious to implement a custom observation distribution type. For this case, the shortcut function <code>obs_weight</code> is provided.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.obs_weight" href="#POMDPTools.ModelTools.obs_weight"><code>POMDPTools.ModelTools.obs_weight</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">obs_weight(pomdp, s, a, sp, o)</code></pre><p>Return a weight proportional to the likelihood of receiving observation o from state sp (and a and s if they are present).</p><p>This is a useful shortcut for particle filtering so that the observation distribution does not have to be represented.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/obs_weight.jl#L4-L10">source</a></section></article><h3 id="Ordered-Spaces"><a class="docs-heading-anchor" href="#Ordered-Spaces">Ordered Spaces</a><a id="Ordered-Spaces-1"></a><a class="docs-heading-anchor-permalink" href="#Ordered-Spaces" title="Permalink"></a></h3><p>It is often useful to have a list of states, 
actions, or observations ordered consistently with the respective <code>index</code> function from POMDPs.jl. Since the POMDPs.jl interface does not demand that spaces be ordered consistently with <code>index</code>, the <code>states</code>, <code>actions</code>, and <code>observations</code> functions are not sufficient. Thus POMDPTools provides <code>ordered_actions</code>, <code>ordered_states</code>, and <code>ordered_observations</code> to provide this capability.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.ordered_actions" href="#POMDPTools.ModelTools.ordered_actions"><code>POMDPTools.ModelTools.ordered_actions</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">ordered_actions(mdp)</code></pre><p>Return an <code>AbstractVector</code> of actions ordered according to <code>actionindex(mdp, a)</code>.</p><p><code>ordered_actions(mdp)</code> will always return an <code>AbstractVector{A}</code> <code>v</code> containing all of the actions in <code>actions(mdp)</code> in the order such that <code>actionindex(mdp, v[i]) == i</code>. 
You may wish to override this for your problem for efficiency.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/ordered_spaces.jl#L3-L9">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.ordered_states" href="#POMDPTools.ModelTools.ordered_states"><code>POMDPTools.ModelTools.ordered_states</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">ordered_states(mdp)</code></pre><p>Return an <code>AbstractVector</code> of states ordered according to <code>stateindex(mdp, a)</code>.</p><p><code>ordered_states(mdp)</code> will always return an <code>AbstractVector{A}</code> <code>v</code> containing all of the states in <code>states(mdp)</code> in the order such that <code>stateindex(mdp, v[i]) == i</code>. 
You may wish to override this for your problem for efficiency.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/ordered_spaces.jl#L12-L18">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.ordered_observations" href="#POMDPTools.ModelTools.ordered_observations"><code>POMDPTools.ModelTools.ordered_observations</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">ordered_observations(pomdp)</code></pre><p>Return an <code>AbstractVector</code> of observations ordered according to <code>obsindex(pomdp, a)</code>.</p><p><code>ordered_observations(mdp)</code> will always return an <code>AbstractVector{A}</code> <code>v</code> containing all of the observations in <code>observations(pomdp)</code> in the order such that <code>obsindex(pomdp, v[i]) == i</code>. You may wish to override this for your problem for efficiency.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/ordered_spaces.jl#L21-L27">source</a></section></article><h3 id="Info-Interface"><a class="docs-heading-anchor" href="#Info-Interface">Info Interface</a><a id="Info-Interface-1"></a><a class="docs-heading-anchor-permalink" href="#Info-Interface" title="Permalink"></a></h3><p>It is often the case that useful information besides the belief, state, action, etc., is generated by a function in POMDPs.jl. This information can be useful for debugging or understanding the behavior of a solver, updater, or problem. 
The info interface provides a standard way for problems, policies, solvers or updaters to output this information. The recording simulators from <a href="../#pomdptools_section">POMDPTools</a> automatically record this information.</p><p>To specify info from policies, solvers, or updaters, implement the following functions:</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.action_info" href="#POMDPTools.ModelTools.action_info"><code>POMDPTools.ModelTools.action_info</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">a, ai = action_info(policy, x)</code></pre><p>Return a tuple containing the action determined by policy &#39;p&#39; at state or belief &#39;x&#39; and information (usually a <code>NamedTuple</code>, <code>Dict</code> or <code>nothing</code>) from the calculation of that action.</p><p>By default, returns <code>nothing</code> as info.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/info.jl#L4-L10">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.solve_info" href="#POMDPTools.ModelTools.solve_info"><code>POMDPTools.ModelTools.solve_info</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">policy, si = solve_info(solver, problem)</code></pre><p>Return a tuple containing the policy determined by a solver and information (usually a <code>NamedTuple</code>, <code>Dict</code> or <code>nothing</code>) from the calculation of that policy.</p><p>By 
default, returns <code>nothing</code> as info.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/info.jl#L15-L21">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.update_info" href="#POMDPTools.ModelTools.update_info"><code>POMDPTools.ModelTools.update_info</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">bp, i = update_info(updater, b, a, o)</code></pre><p>Return a tuple containing the new belief and information (usually a <code>NamedTuple</code>, <code>Dict</code> or <code>nothing</code>) from the belief update.</p><p>By default, returns <code>nothing</code> as info.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/info.jl#L26-L32">source</a></section></article><h2 id="Model-Transformations"><a class="docs-heading-anchor" href="#Model-Transformations">Model Transformations</a><a id="Model-Transformations-1"></a><a class="docs-heading-anchor-permalink" href="#Model-Transformations" title="Permalink"></a></h2><p>POMDPTools contains several tools for transforming problems into other classes so that they can be used by different solvers.</p><h3 id="Linear-Algebra-Representations"><a class="docs-heading-anchor" href="#Linear-Algebra-Representations">Linear Algebra Representations</a><a id="Linear-Algebra-Representations-1"></a><a class="docs-heading-anchor-permalink" href="#Linear-Algebra-Representations" title="Permalink"></a></h3><p>For some algorithms, such as value iteration, it is convenient to use vectors that contain the reward for every state, and matrices 
that contain the transition probabilities. These can be constructed with the following functions:</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.transition_matrices" href="#POMDPTools.ModelTools.transition_matrices"><code>POMDPTools.ModelTools.transition_matrices</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">transition_matrices(p::SparseTabularProblem)</code></pre><p>Accessor function for the transition model of a sparse tabular problem. It returns a list of sparse matrices for each action of the problem.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L304-L309">source</a></section><section><div><pre><code class="language-julia hljs">transition_matrices(m::Union{MDP,POMDP})
+transition_matrices(m; sparse=true)</code></pre><p>Construct transition matrices for (PO)MDP m.</p><p>The returned object is an associative object (usually a Dict), where the keys are actions. Each value in this object is an AbstractMatrix where the row corresponds to the state index of s and the column corresponds to the state index of s&#39;. The entry in the matrix is the probability of transitioning from state s to state s&#39;.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/matrices.jl#L1-L8">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.reward_vectors" href="#POMDPTools.ModelTools.reward_vectors"><code>POMDPTools.ModelTools.reward_vectors</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">reward_vectors(m::Union{MDP, POMDP})</code></pre><p>Construct reward vectors for (PO)MDP m.</p><p>The returned object is an associative object (usually a Dict), where the keys are actions. 
Each value in this object is an AbstractVector where the index corresponds to the state index of s and the entry is the reward for that state.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/matrices.jl#L19-L25">source</a></section></article><h3 id="Sparse-Tabular-MDPs-and-POMDPs"><a class="docs-heading-anchor" href="#Sparse-Tabular-MDPs-and-POMDPs">Sparse Tabular MDPs and POMDPs</a><a id="Sparse-Tabular-MDPs-and-POMDPs-1"></a><a class="docs-heading-anchor-permalink" href="#Sparse-Tabular-MDPs-and-POMDPs" title="Permalink"></a></h3><p>The <code>SparseTabularMDP</code> and <code>SparseTabularPOMDP</code> represents discrete problems defined using the explicit interface. The transition and observation models are represented using sparse matrices. Solver writers can leverage these data structures to write efficient vectorized code. A problem writer can define its problem using the explicit interface and it can be automatically converted to a sparse tabular representation by calling the constructors <code>SparseTabularMDP(::MDP)</code> or <code>SparseTabularPOMDP(::POMDP)</code>. See the following docs to know more about the matrix representation and how to access the fields of the <code>SparseTabular</code> objects:</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.SparseTabularMDP" href="#POMDPTools.ModelTools.SparseTabularMDP"><code>POMDPTools.ModelTools.SparseTabularMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">SparseTabularMDP</code></pre><p>An MDP object where states and actions are integers and the transition is represented by a list of sparse matrices. 
This data structure can be useful to exploit in vectorized algorithms (e.g. see SparseValueIterationSolver). The recommended way to access the transition and reward matrices is through the provided accessor functions: <code>transition_matrix</code> and <code>reward_vector</code>.</p><p><strong>Fields</strong></p><ul><li><code>T::Vector{SparseMatrixCSC{Float64, Int64}}</code> The transition model is represented as a vector of sparse matrices (one for each action). <code>T[a][s, sp]</code> the probability of transition from <code>s</code> to <code>sp</code> taking action <code>a</code>.</li><li><code>R::Array{Float64, 2}</code> The reward is represented as a matrix where the rows are states and the columns actions: <code>R[s, a]</code> is the reward of taking action <code>a</code> in state <code>s</code>.</li><li><code>initial_probs::SparseVector{Float64, Int64}</code> Specifies the initial state distribution</li><li><code>terminal_states::Set{Int64}</code> Stores the terminal states</li><li><code>discount::Float64</code> The discount factor</li></ul><p><strong>Constructors</strong></p><ul><li><code>SparseTabularMDP(mdp::MDP)</code> : One can provide the matrices to the default constructor or one can construct a <code>SparseTabularMDP</code> from any discrete state MDP defined using the explicit interface. </li></ul><p>Note that constructing the transition and reward matrices requires iterating over all the states and can take a while. 
To learn more information about how to define an MDP with the explicit interface please visit https://juliapomdp.github.io/POMDPs.jl/latest/explicit/ .</p><ul><li><code>SparseTabularMDP(smdp::SparseTabularMDP; transition, reward, discount)</code> : This constructor returns a new sparse MDP that is a copy of the original smdp except for the field specified by the keyword arguments.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L1-L21">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.SparseTabularPOMDP" href="#POMDPTools.ModelTools.SparseTabularPOMDP"><code>POMDPTools.ModelTools.SparseTabularPOMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">SparseTabularPOMDP</code></pre><p>A POMDP object where states and actions are integers and the transition and observation distributions are represented by lists of sparse matrices. This data structure can be useful to exploit in vectorized algorithms to gain performance (e.g. see SparseValueIterationSolver). The recommended way to access the transition, reward, and observation matrices is through the provided accessor functions: <code>transition_matrix</code>, <code>reward_vector</code>, <code>observation_matrix</code>.</p><p><strong>Fields</strong></p><ul><li><code>T::Vector{SparseMatrixCSC{Float64, Int64}}</code> The transition model is represented as a vector of sparse matrices (one for each action). 
<code>T[a][s, sp]</code> the probability of transition from <code>s</code> to <code>sp</code> taking action <code>a</code>.</li><li><code>R::Array{Float64, 2}</code> The reward is represented as a matrix where the rows are states and the columns actions: <code>R[s, a]</code> is the reward of taking action <code>a</code> in state <code>s</code>.</li><li><code>O::Vector{SparseMatrixCSC{Float64, Int64}}</code> The observation model is represented as a vector of sparse matrices (one for each action). <code>O[a][sp, o]</code> is the probability of observing <code>o</code> from state <code>sp</code> after having taken action <code>a</code>.</li><li><code>initial_probs::SparseVector{Float64, Int64}</code> Specifies the initial state distribution</li><li><code>terminal_states::Set{Int64}</code> Stores the terminal states</li><li><code>discount::Float64</code> The discount factor</li></ul><p><strong>Constructors</strong></p><ul><li><code>SparseTabularPOMDP(pomdp::POMDP)</code> : One can provide the matrices to the default constructor or one can construct a <code>SparseTabularPOMDP</code> from any discrete state MDP defined using the explicit interface. </li></ul><p>Note that constructing the transition and reward matrices requires iterating over all the states and can take a while. 
To learn more information about how to define an MDP with the explicit interface please visit https://juliapomdp.github.io/POMDPs.jl/latest/explicit/ .</p><ul><li><code>SparseTabularPOMDP(spomdp::SparseTabularMDP; transition, reward, observation, discount)</code> : This constructor returns a new sparse POMDP that is a copy of the original smdp except for the field specified by the keyword arguments.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L76-L99">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.transition_matrix" href="#POMDPTools.ModelTools.transition_matrix"><code>POMDPTools.ModelTools.transition_matrix</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">transition_matrix(p::SparseTabularProblem, a)</code></pre><p>Accessor function for the transition model of a sparse tabular problem. 
It returns a sparse matrix containing the transition probabilities when taking action a: T[s, sp] = Pr(sp | s, a).</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L297-L301">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.reward_vector" href="#POMDPTools.ModelTools.reward_vector"><code>POMDPTools.ModelTools.reward_vector</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">reward_vector(p::SparseTabularProblem, a)</code></pre><p>Accessor function for the reward function of a sparse tabular problem. It returns a vector containing the reward for all the states when taking action a: R(s, a).  The length of the return vector is equal to the number of states.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L311-L316">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.observation_matrix" href="#POMDPTools.ModelTools.observation_matrix"><code>POMDPTools.ModelTools.observation_matrix</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">observation_matrix(p::SparseTabularPOMDP, a::Int64)</code></pre><p>Accessor function for the observation model of a sparse tabular POMDP. 
It returns a sparse matrix containing the observation probabilities when having taken action a: O[sp, o] = Pr(o | sp, a).</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L333-L337">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.reward_matrix" href="#POMDPTools.ModelTools.reward_matrix"><code>POMDPTools.ModelTools.reward_matrix</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">reward_matrix(p::SparseTabularProblem)</code></pre><p>Accessor function for the reward matrix R[s, a] of a sparse tabular problem.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L319-L323">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.observation_matrices" href="#POMDPTools.ModelTools.observation_matrices"><code>POMDPTools.ModelTools.observation_matrices</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">observation_matrices(p::SparseTabularPOMDP)</code></pre><p>Accessor function for the observation model of a sparse tabular POMDP. 
It returns a list of sparse matrices for each action of the problem.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/sparse_tabular.jl#L340-L345">source</a></section></article><h3 id="Fully-Observable-POMDP"><a class="docs-heading-anchor" href="#Fully-Observable-POMDP">Fully Observable POMDP</a><a id="Fully-Observable-POMDP-1"></a><a class="docs-heading-anchor-permalink" href="#Fully-Observable-POMDP" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.FullyObservablePOMDP" href="#POMDPTools.ModelTools.FullyObservablePOMDP"><code>POMDPTools.ModelTools.FullyObservablePOMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">FullyObservablePOMDP(mdp)</code></pre><p>Turn <code>MDP</code> <code>mdp</code> into a <code>POMDP</code> where the observations are the states of the MDP.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/fully_observable_pomdp.jl#L1-L5">source</a></section></article><h3 id="Generative-Belief-MDP"><a class="docs-heading-anchor" href="#Generative-Belief-MDP">Generative Belief MDP</a><a id="Generative-Belief-MDP-1"></a><a class="docs-heading-anchor-permalink" href="#Generative-Belief-MDP" title="Permalink"></a></h3><p>Every POMDP is an MDP on the belief space. <code>GenerativeBeliefMDP</code> creates a generative model for that MDP.</p><div class="admonition is-warning"><header class="admonition-header">Warning</header><div class="admonition-body"><p>The reward generated by the <code>GenerativeBeliefMDP</code> is the reward for a <em>single state sampled 
from the belief</em>; it is not the   expected reward for that belief transition (though, in expectation, they are equivalent of course). Implementing the model with the expected reward requires a custom implementation because belief updaters do not typically deal with reward.</p></div></div><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.GenerativeBeliefMDP" href="#POMDPTools.ModelTools.GenerativeBeliefMDP"><code>POMDPTools.ModelTools.GenerativeBeliefMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">GenerativeBeliefMDP(pomdp, updater)
+GenerativeBeliefMDP(pomdp, updater; terminal_behavior=TerminalStateTerminalBehavior())</code></pre><p>Create a generative model of the belief MDP corresponding to POMDP <code>pomdp</code> with belief updates performed by <code>updater</code>. Each step is performed by sampling a state from the current belief, generating an observation from that state and action, and then using <code>updater</code> to update the belief.</p><p>A belief is considered terminal when <em>all</em> POMDP states in the support with nonzero probability are terminal.</p><p>The default behavior when a terminal POMDP state is sampled from the belief is to transition to <a href="#POMDPTools.ModelTools.terminalstate"><code>terminalstate</code></a>. This can be controlled by the <code>terminal_behavior</code> keyword argument. Using <code>terminal_behavior=ContinueTerminalBehavior(pomdp, updater)</code> will cause the MDP to keep attempting a belief update even when the sampled state is terminal. This can be further customized by providing <code>terminal_behavior</code> with a <code>Function</code> or callable object that takes arguments <code>b, s, a, rng</code> and returns a new belief (see the implementation of <code>ContinueTerminalBehavior</code> for an example). You can customize behavior additionally using <code>determine_gbmdp_state_type</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/generative_belief_mdp.jl#L1-L10">source</a></section></article><h4 id="Example"><a class="docs-heading-anchor" href="#Example">Example</a><a id="Example-1"></a><a class="docs-heading-anchor-permalink" href="#Example" title="Permalink"></a></h4><pre><code class="language-julia hljs">using POMDPs
 using POMDPModels
 using POMDPTools
 
@@ -27,7 +27,7 @@
 (a, r, sp) = (true, -5.0, DiscreteBelief{POMDPModels.BabyPOMDP, Bool}(POMDPModels.BabyPOMDP(-5.0, -10.0, 0.1, 0.8, 0.1, 0.9), Bool[0, 1], [1.0, 0.0]))
 (a, r, sp) = (true, -5.0, DiscreteBelief{POMDPModels.BabyPOMDP, Bool}(POMDPModels.BabyPOMDP(-5.0, -10.0, 0.1, 0.8, 0.1, 0.9), Bool[0, 1], [1.0, 0.0]))
 (a, r, sp) = (false, 0.0, DiscreteBelief{POMDPModels.BabyPOMDP, Bool}(POMDPModels.BabyPOMDP(-5.0, -10.0, 0.1, 0.8, 0.1, 0.9), Bool[0, 1], [0.9759036144578314, 0.02409638554216867]))
-(a, r, sp) = (false, 0.0, DiscreteBelief{POMDPModels.BabyPOMDP, Bool}(POMDPModels.BabyPOMDP(-5.0, -10.0, 0.1, 0.8, 0.1, 0.9), Bool[0, 1], [0.9701315984030756, 0.029868401596924433]))</code></pre><h3 id="Underlying-MDP"><a class="docs-heading-anchor" href="#Underlying-MDP">Underlying MDP</a><a id="Underlying-MDP-1"></a><a class="docs-heading-anchor-permalink" href="#Underlying-MDP" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.UnderlyingMDP" href="#POMDPTools.ModelTools.UnderlyingMDP"><code>POMDPTools.ModelTools.UnderlyingMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">UnderlyingMDP(m::POMDP)</code></pre><p>Transform <code>POMDP</code> <code>m</code> into an <code>MDP</code> where the states are fully observed.</p><pre><code class="nohighlight hljs">UnderlyingMDP(m::MDP)</code></pre><p>Return <code>m</code></p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/underlying_mdp.jl#L1-L9">source</a></section></article><h3 id="State-Action-Reward-Model"><a class="docs-heading-anchor" href="#State-Action-Reward-Model">State Action Reward Model</a><a id="State-Action-Reward-Model-1"></a><a class="docs-heading-anchor-permalink" href="#State-Action-Reward-Model" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.StateActionReward" href="#POMDPTools.ModelTools.StateActionReward"><code>POMDPTools.ModelTools.StateActionReward</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code 
class="language-julia hljs">StateActionReward(m::Union{MDP,POMDP})</code></pre><p>Robustly create a reward function that depends only on the state and action.</p><p>If <code>reward(m, s, a)</code> is implemented, that will be used, otherwise the mean of <code>reward(m, s, a, sp)</code> for MDPs or <code>reward(m, s, a, sp, o)</code> for POMDPs will be used.</p><p><strong>Example</strong></p><pre><code class="language-julia hljs">using POMDPs
+(a, r, sp) = (false, 0.0, DiscreteBelief{POMDPModels.BabyPOMDP, Bool}(POMDPModels.BabyPOMDP(-5.0, -10.0, 0.1, 0.8, 0.1, 0.9), Bool[0, 1], [0.9701315984030756, 0.029868401596924433]))</code></pre><h3 id="Underlying-MDP"><a class="docs-heading-anchor" href="#Underlying-MDP">Underlying MDP</a><a id="Underlying-MDP-1"></a><a class="docs-heading-anchor-permalink" href="#Underlying-MDP" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.UnderlyingMDP" href="#POMDPTools.ModelTools.UnderlyingMDP"><code>POMDPTools.ModelTools.UnderlyingMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">UnderlyingMDP(m::POMDP)</code></pre><p>Transform <code>POMDP</code> <code>m</code> into an <code>MDP</code> where the states are fully observed.</p><pre><code class="nohighlight hljs">UnderlyingMDP(m::MDP)</code></pre><p>Return <code>m</code></p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/underlying_mdp.jl#L1-L9">source</a></section></article><h3 id="State-Action-Reward-Model"><a class="docs-heading-anchor" href="#State-Action-Reward-Model">State Action Reward Model</a><a id="State-Action-Reward-Model-1"></a><a class="docs-heading-anchor-permalink" href="#State-Action-Reward-Model" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.StateActionReward" href="#POMDPTools.ModelTools.StateActionReward"><code>POMDPTools.ModelTools.StateActionReward</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code 
class="language-julia hljs">StateActionReward(m::Union{MDP,POMDP})</code></pre><p>Robustly create a reward function that depends only on the state and action.</p><p>If <code>reward(m, s, a)</code> is implemented, that will be used, otherwise the mean of <code>reward(m, s, a, sp)</code> for MDPs or <code>reward(m, s, a, sp, o)</code> for POMDPs will be used.</p><p><strong>Example</strong></p><pre><code class="language-julia hljs">using POMDPs
 using POMDPModels
 using POMDPTools
 
@@ -39,4 +39,4 @@
 
 # output
 
--15.0</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/state_action_reward.jl#L1-L24">source</a></section></article><h2 id="Utility-Types"><a class="docs-heading-anchor" href="#Utility-Types">Utility Types</a><a id="Utility-Types-1"></a><a class="docs-heading-anchor-permalink" href="#Utility-Types" title="Permalink"></a></h2><h3 id="Terminal-State"><a class="docs-heading-anchor" href="#Terminal-State">Terminal State</a><a id="Terminal-State-1"></a><a class="docs-heading-anchor-permalink" href="#Terminal-State" title="Permalink"></a></h3><p><code>TerminalState</code> and its singleton instance <code>terminalstate</code> are available to use for a terminal state in concert with another state type. It has the appropriate type promotion logic to make its use with other types friendly, similar to <code>nothing</code> and <code>missing</code>.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>NOTE: This is NOT a replacement for the standard POMDPs.jl isterminal function, though isterminal is implemented for the type. 
It is merely a convenient type to use for terminal states.</p></div></div><div class="admonition is-warning"><header class="admonition-header">Warning</header><div class="admonition-body"><p>WARNING: Early tests (August 2018) suggest that the Julia 1.0 compiler will not be able to efficiently implement union splitting in cases as  complex as POMDPs, so using a <code>Union</code> for the state type of a problem can currently have a large overhead.</p></div></div><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.TerminalState" href="#POMDPTools.ModelTools.TerminalState"><code>POMDPTools.ModelTools.TerminalState</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">TerminalState</code></pre><p>A type with no fields whose singleton instance <code>terminalstate</code> is used to represent a terminal state with no additional information.</p><p>This type has the appropriate promotion logic implemented to function like <code>Missing</code> when added to arrays, etc.</p><p>Note that terminal states NEED NOT be of type <code>TerminalState</code>. You can define any state to be terminal by implementing the appropriate <code>isterminal</code> method. Solvers and simulators SHOULD NOT check for this type, but should instead check using <code>isterminal</code>. 
</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/terminal_state.jl#L1-L9">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.terminalstate" href="#POMDPTools.ModelTools.terminalstate"><code>POMDPTools.ModelTools.terminalstate</code></a> — <span class="docstring-category">Constant</span></header><section><div><pre><code class="language-julia hljs">terminalstate</code></pre><p>The singleton instance of type <a href="#POMDPTools.ModelTools.TerminalState"><code>TerminalState</code></a> representing a terminal state.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/terminal_state.jl#L12-L16">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../distributions/">« Implemented Distributions</a><a class="docs-footer-nextpage" href="../visualization/">Visualization »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option 
value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+-15.0</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/state_action_reward.jl#L1-L24">source</a></section></article><h2 id="Utility-Types"><a class="docs-heading-anchor" href="#Utility-Types">Utility Types</a><a id="Utility-Types-1"></a><a class="docs-heading-anchor-permalink" href="#Utility-Types" title="Permalink"></a></h2><h3 id="Terminal-State"><a class="docs-heading-anchor" href="#Terminal-State">Terminal State</a><a id="Terminal-State-1"></a><a class="docs-heading-anchor-permalink" href="#Terminal-State" title="Permalink"></a></h3><p><code>TerminalState</code> and its singleton instance <code>terminalstate</code> are available to use for a terminal state in concert with another state type. It has the appropriate type promotion logic to make its use with other types friendly, similar to <code>nothing</code> and <code>missing</code>.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>NOTE: This is NOT a replacement for the standard POMDPs.jl isterminal function, though isterminal is implemented for the type. 
It is merely a convenient type to use for terminal states.</p></div></div><div class="admonition is-warning"><header class="admonition-header">Warning</header><div class="admonition-body"><p>WARNING: Early tests (August 2018) suggest that the Julia 1.0 compiler will not be able to efficiently implement union splitting in cases as  complex as POMDPs, so using a <code>Union</code> for the state type of a problem can currently have a large overhead.</p></div></div><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.TerminalState" href="#POMDPTools.ModelTools.TerminalState"><code>POMDPTools.ModelTools.TerminalState</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">TerminalState</code></pre><p>A type with no fields whose singleton instance <code>terminalstate</code> is used to represent a terminal state with no additional information.</p><p>This type has the appropriate promotion logic implemented to function like <code>Missing</code> when added to arrays, etc.</p><p>Note that terminal states NEED NOT be of type <code>TerminalState</code>. You can define any state to be terminal by implementing the appropriate <code>isterminal</code> method. Solvers and simulators SHOULD NOT check for this type, but should instead check using <code>isterminal</code>. 
</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/terminal_state.jl#L1-L9">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.terminalstate" href="#POMDPTools.ModelTools.terminalstate"><code>POMDPTools.ModelTools.terminalstate</code></a> — <span class="docstring-category">Constant</span></header><section><div><pre><code class="language-julia hljs">terminalstate</code></pre><p>The singleton instance of type <a href="#POMDPTools.ModelTools.TerminalState"><code>TerminalState</code></a> representing a terminal state.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/terminal_state.jl#L12-L16">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../distributions/">« Implemented Distributions</a><a class="docs-footer-nextpage" href="../visualization/">Visualization »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option 
value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/POMDPTools/policies/index.html b/dev/POMDPTools/policies/index.html
index 9d9d434e..b372bc34 100644
--- a/dev/POMDPTools/policies/index.html
+++ b/dev/POMDPTools/policies/index.html
@@ -1,8 +1,8 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Implemented Policies · POMDPs.jl</title><meta name="title" content="Implemented Policies · POMDPs.jl"/><meta property="og:title" content="Implemented Policies · POMDPs.jl"/><meta property="twitter:title" content="Implemented Policies · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link 
class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../../">POMDPs.jl</a></li><li><a class="tocitem" href="../../install/">Installation</a></li><li><a class="tocitem" href="../../get_started/">Getting Started</a></li><li><a class="tocitem" href="../../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../../def_solver/">Solvers</a></li><li><a class="tocitem" href="../../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span 
class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../../examples/">Examples</a></li><li><a class="tocitem" href="../../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../model/">Model Tools</a></li><li><a class="tocitem" href="../visualization/">Visualization</a></li><li><a class="tocitem" href="../beliefs/">Implemented Belief Updaters</a></li><li class="is-active"><a class="tocitem" href>Implemented Policies</a><ul class="internal"><li><a class="tocitem" href="#Function"><span>Function</span></a></li><li><a class="tocitem" href="#Alpha-Vector-Policy"><span>Alpha Vector Policy</span></a></li><li><a class="tocitem" href="#Random-Policy"><span>Random Policy</span></a></li><li><a class="tocitem" href="#Stochastic-Policies"><span>Stochastic Policies</span></a></li><li><a class="tocitem" href="#Vector-Policies"><span>Vector Policies</span></a></li><li><a class="tocitem" 
href="#Value-Dict-Policy"><span>Value Dict Policy</span></a></li><li><a class="tocitem" href="#Exploration-Policies"><span>Exploration Policies</span></a></li><li><a class="tocitem" href="#Playback-Policy"><span>Playback Policy</span></a></li><li><a class="tocitem" href="#Utility-Wrapper"><span>Utility Wrapper</span></a></li><li><a class="tocitem" href="#Pretty-Printing-Policies"><span>Pretty Printing Policies</span></a></li><li class="toplevel"><a class="tocitem" href="#Policy-Evaluation"><span>Policy Evaluation</span></a></li></ul></li><li><a class="tocitem" href="../simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">POMDPTools</a></li><li class="is-active"><a href>Implemented Policies</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Implemented Policies</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/POMDPTools/policies.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Implemented-Policies"><a class="docs-heading-anchor" href="#Implemented-Policies">Implemented Policies</a><a id="Implemented-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Implemented-Policies" title="Permalink"></a></h1><p>POMDPTools currently provides the following policy types:</p><ul><li>a wrapper to turn a function into a <code>Policy</code></li><li>an alpha vector policy type</li><li>a random policy</li><li>a stochastic policy type</li><li>exploration policies</li><li>a vector policy type</li><li>a wrapper to collect statistics and errors about policies</li></ul><p>In addition, it provides the <a href="#POMDPTools.Policies.showpolicy"><code>showpolicy</code></a> function for printing policies similar to the way that matrices are printed in the repl and the <a href="#POMDPTools.Policies.evaluate"><code>evaluate</code></a> function for evaluating MDP policies.</p><h2 id="Function"><a class="docs-heading-anchor" href="#Function">Function</a><a id="Function-1"></a><a class="docs-heading-anchor-permalink" href="#Function" title="Permalink"></a></h2><p>Wraps a <code>Function</code> mapping states to actions into a <code>Policy</code>. 
</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.FunctionPolicy" href="#POMDPTools.Policies.FunctionPolicy"><code>POMDPTools.Policies.FunctionPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><p>FunctionPolicy</p><p>Policy <code>p=FunctionPolicy(f)</code> returns <code>f(x)</code> when <code>action(p, x)</code> is called.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/function.jl#L5-L9">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.FunctionSolver" href="#POMDPTools.Policies.FunctionSolver"><code>POMDPTools.Policies.FunctionSolver</code></a> — <span class="docstring-category">Type</span></header><section><div><p>FunctionSolver</p><p>Solver for a FunctionPolicy.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/function.jl#L14-L18">source</a></section></article><h2 id="Alpha-Vector-Policy"><a class="docs-heading-anchor" href="#Alpha-Vector-Policy">Alpha Vector Policy</a><a id="Alpha-Vector-Policy-1"></a><a class="docs-heading-anchor-permalink" href="#Alpha-Vector-Policy" title="Permalink"></a></h2><p>Represents a policy with a set of alpha vectors (See <code>AlphaVectorPolicy</code> constructor docstring). 
In addition to finding the optimal action with <code>action</code>, the alpha vectors can be accessed with <a href="#POMDPTools.Policies.alphavectors"><code>alphavectors</code></a> or <a href="#POMDPTools.Policies.alphapairs"><code>alphapairs</code></a>.</p><p>Determining the estimated value and optimal action depends on calculating the dot product between alpha vectors and a belief vector. <a href="#POMDPTools.Policies.beliefvec"><code>POMDPTools.Policies.beliefvec(pomdp, b)</code></a> is used to create this vector and can be overridden for new belief types for efficiency.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.AlphaVectorPolicy" href="#POMDPTools.Policies.AlphaVectorPolicy"><code>POMDPTools.Policies.AlphaVectorPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">AlphaVectorPolicy(pomdp::POMDP, alphas, action_map)</code></pre><p>Construct a policy from alpha vectors.</p><p><strong>Arguments</strong></p><ul><li><p><code>alphas</code>: an |S| x (number of alpha vecs) matrix or a vector of alpha vectors.</p></li><li><p><code>action_map</code>: a vector of the actions correponding to each alpha vector</p><p>AlphaVectorPolicy{P&lt;:POMDP, A}</p></li></ul><p>Represents a policy with a set of alpha vectors.</p><p>Use <code>action</code> to get the best action for a belief, and <code>alphavectors</code> and <code>alphapairs</code> to </p><p><strong>Fields</strong></p><ul><li><code>pomdp::P</code> the POMDP problem </li><li><code>n_states::Int</code> the number of states in the POMDP</li><li><code>alphas::Vector{Vector{Float64}}</code> the list of alpha vectors</li><li><code>action_map::Vector{A}</code> a list of action corresponding to the alpha vectors</li></ul></div><a class="docs-sourcelink" target="_blank" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/alpha_vector.jl#L1-L21">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.alphavectors" href="#POMDPTools.Policies.alphavectors"><code>POMDPTools.Policies.alphavectors</code></a> — <span class="docstring-category">Function</span></header><section><div><p>Return the alpha vectors.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/alpha_vector.jl#L56-L58">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.alphapairs" href="#POMDPTools.Policies.alphapairs"><code>POMDPTools.Policies.alphapairs</code></a> — <span class="docstring-category">Function</span></header><section><div><p>Return an iterator of alpha vector-action pairs in the policy.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/alpha_vector.jl#L51-L53">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.beliefvec" href="#POMDPTools.Policies.beliefvec"><code>POMDPTools.Policies.beliefvec</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">POMDPTools.Policies.beliefvec(m::POMDP, n_states::Int, b)</code></pre><p>Return a vector-like 
representation of the belief <code>b</code> suitable for calculating the dot product with the alpha vectors.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/alpha_vector.jl#L97-L101">source</a></section></article><h2 id="Random-Policy"><a class="docs-heading-anchor" href="#Random-Policy">Random Policy</a><a id="Random-Policy-1"></a><a class="docs-heading-anchor-permalink" href="#Random-Policy" title="Permalink"></a></h2><p>A policy that returns a randomly selected action using <code>rand(rng, actions(pomdp))</code>.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.RandomPolicy" href="#POMDPTools.Policies.RandomPolicy"><code>POMDPTools.Policies.RandomPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">RandomPolicy{RNG&lt;:AbstractRNG, P&lt;:Union{POMDP,MDP}, U&lt;:Updater}</code></pre><p>a generic policy that uses the actions function to create a list of actions and then randomly samples an action from it.</p><p>Constructor:</p><pre><code class="nohighlight hljs">`RandomPolicy(problem::Union{POMDP,MDP};
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Implemented Policies · POMDPs.jl</title><meta name="title" content="Implemented Policies · POMDPs.jl"/><meta property="og:title" content="Implemented Policies · POMDPs.jl"/><meta property="twitter:title" content="Implemented Policies · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link 
class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../../">POMDPs.jl</a></li><li><a class="tocitem" href="../../install/">Installation</a></li><li><a class="tocitem" href="../../get_started/">Getting Started</a></li><li><a class="tocitem" href="../../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../../def_solver/">Solvers</a></li><li><a class="tocitem" href="../../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span 
class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../../examples/">Examples</a></li><li><a class="tocitem" href="../../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../model/">Model Tools</a></li><li><a class="tocitem" href="../visualization/">Visualization</a></li><li><a class="tocitem" href="../beliefs/">Implemented Belief Updaters</a></li><li class="is-active"><a class="tocitem" href>Implemented Policies</a><ul class="internal"><li><a class="tocitem" href="#Function"><span>Function</span></a></li><li><a class="tocitem" href="#Alpha-Vector-Policy"><span>Alpha Vector Policy</span></a></li><li><a class="tocitem" href="#Random-Policy"><span>Random Policy</span></a></li><li><a class="tocitem" href="#Stochastic-Policies"><span>Stochastic Policies</span></a></li><li><a class="tocitem" href="#Vector-Policies"><span>Vector Policies</span></a></li><li><a class="tocitem" 
href="#Value-Dict-Policy"><span>Value Dict Policy</span></a></li><li><a class="tocitem" href="#Exploration-Policies"><span>Exploration Policies</span></a></li><li><a class="tocitem" href="#Playback-Policy"><span>Playback Policy</span></a></li><li><a class="tocitem" href="#Utility-Wrapper"><span>Utility Wrapper</span></a></li><li><a class="tocitem" href="#Pretty-Printing-Policies"><span>Pretty Printing Policies</span></a></li><li class="toplevel"><a class="tocitem" href="#Policy-Evaluation"><span>Policy Evaluation</span></a></li></ul></li><li><a class="tocitem" href="../simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">POMDPTools</a></li><li class="is-active"><a href>Implemented Policies</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Implemented Policies</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/POMDPTools/policies.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Implemented-Policies"><a class="docs-heading-anchor" href="#Implemented-Policies">Implemented Policies</a><a id="Implemented-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Implemented-Policies" title="Permalink"></a></h1><p>POMDPTools currently provides the following policy types:</p><ul><li>a wrapper to turn a function into a <code>Policy</code></li><li>an alpha vector policy type</li><li>a random policy</li><li>a stochastic policy type</li><li>exploration policies</li><li>a vector policy type</li><li>a wrapper to collect statistics and errors about policies</li></ul><p>In addition, it provides the <a href="#POMDPTools.Policies.showpolicy"><code>showpolicy</code></a> function for printing policies similar to the way that matrices are printed in the repl and the <a href="#POMDPTools.Policies.evaluate"><code>evaluate</code></a> function for evaluating MDP policies.</p><h2 id="Function"><a class="docs-heading-anchor" href="#Function">Function</a><a id="Function-1"></a><a class="docs-heading-anchor-permalink" href="#Function" title="Permalink"></a></h2><p>Wraps a <code>Function</code> mapping states to actions into a <code>Policy</code>. 
</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.FunctionPolicy" href="#POMDPTools.Policies.FunctionPolicy"><code>POMDPTools.Policies.FunctionPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><p>FunctionPolicy</p><p>Policy <code>p=FunctionPolicy(f)</code> returns <code>f(x)</code> when <code>action(p, x)</code> is called.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/function.jl#L5-L9">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.FunctionSolver" href="#POMDPTools.Policies.FunctionSolver"><code>POMDPTools.Policies.FunctionSolver</code></a> — <span class="docstring-category">Type</span></header><section><div><p>FunctionSolver</p><p>Solver for a FunctionPolicy.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/function.jl#L14-L18">source</a></section></article><h2 id="Alpha-Vector-Policy"><a class="docs-heading-anchor" href="#Alpha-Vector-Policy">Alpha Vector Policy</a><a id="Alpha-Vector-Policy-1"></a><a class="docs-heading-anchor-permalink" href="#Alpha-Vector-Policy" title="Permalink"></a></h2><p>Represents a policy with a set of alpha vectors (See <code>AlphaVectorPolicy</code> constructor docstring). 
In addition to finding the optimal action with <code>action</code>, the alpha vectors can be accessed with <a href="#POMDPTools.Policies.alphavectors"><code>alphavectors</code></a> or <a href="#POMDPTools.Policies.alphapairs"><code>alphapairs</code></a>.</p><p>Determining the estimated value and optimal action depends on calculating the dot product between alpha vectors and a belief vector. <a href="#POMDPTools.Policies.beliefvec"><code>POMDPTools.Policies.beliefvec(pomdp, b)</code></a> is used to create this vector and can be overridden for new belief types for efficiency.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.AlphaVectorPolicy" href="#POMDPTools.Policies.AlphaVectorPolicy"><code>POMDPTools.Policies.AlphaVectorPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">AlphaVectorPolicy(pomdp::POMDP, alphas, action_map)</code></pre><p>Construct a policy from alpha vectors.</p><p><strong>Arguments</strong></p><ul><li><p><code>alphas</code>: an |S| x (number of alpha vecs) matrix or a vector of alpha vectors.</p></li><li><p><code>action_map</code>: a vector of the actions correponding to each alpha vector</p><p>AlphaVectorPolicy{P&lt;:POMDP, A}</p></li></ul><p>Represents a policy with a set of alpha vectors.</p><p>Use <code>action</code> to get the best action for a belief, and <code>alphavectors</code> and <code>alphapairs</code> to </p><p><strong>Fields</strong></p><ul><li><code>pomdp::P</code> the POMDP problem </li><li><code>n_states::Int</code> the number of states in the POMDP</li><li><code>alphas::Vector{Vector{Float64}}</code> the list of alpha vectors</li><li><code>action_map::Vector{A}</code> a list of action corresponding to the alpha vectors</li></ul></div><a class="docs-sourcelink" target="_blank" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/alpha_vector.jl#L1-L21">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.alphavectors" href="#POMDPTools.Policies.alphavectors"><code>POMDPTools.Policies.alphavectors</code></a> — <span class="docstring-category">Function</span></header><section><div><p>Return the alpha vectors.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/alpha_vector.jl#L56-L58">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.alphapairs" href="#POMDPTools.Policies.alphapairs"><code>POMDPTools.Policies.alphapairs</code></a> — <span class="docstring-category">Function</span></header><section><div><p>Return an iterator of alpha vector-action pairs in the policy.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/alpha_vector.jl#L51-L53">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.beliefvec" href="#POMDPTools.Policies.beliefvec"><code>POMDPTools.Policies.beliefvec</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">POMDPTools.Policies.beliefvec(m::POMDP, n_states::Int, b)</code></pre><p>Return a vector-like 
representation of the belief <code>b</code> suitable for calculating the dot product with the alpha vectors.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/alpha_vector.jl#L97-L101">source</a></section></article><h2 id="Random-Policy"><a class="docs-heading-anchor" href="#Random-Policy">Random Policy</a><a id="Random-Policy-1"></a><a class="docs-heading-anchor-permalink" href="#Random-Policy" title="Permalink"></a></h2><p>A policy that returns a randomly selected action using <code>rand(rng, actions(pomdp))</code>.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.RandomPolicy" href="#POMDPTools.Policies.RandomPolicy"><code>POMDPTools.Policies.RandomPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">RandomPolicy{RNG&lt;:AbstractRNG, P&lt;:Union{POMDP,MDP}, U&lt;:Updater}</code></pre><p>a generic policy that uses the actions function to create a list of actions and then randomly samples an action from it.</p><p>Constructor:</p><pre><code class="nohighlight hljs">`RandomPolicy(problem::Union{POMDP,MDP};
          rng=Random.default_rng(),
-         updater=NothingUpdater())`</code></pre><p><strong>Fields</strong></p><ul><li><code>rng::RNG</code> a random number generator </li><li><code>probelm::P</code> the POMDP or MDP problem </li><li><code>updater::U</code> a belief updater (default to <code>NothingUpdater</code> in the above constructor)</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/random.jl#L3-L17">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.RandomSolver" href="#POMDPTools.Policies.RandomSolver"><code>POMDPTools.Policies.RandomSolver</code></a> — <span class="docstring-category">Type</span></header><section><div><p>solver that produces a random policy</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/random.jl#L40-L42">source</a></section></article><h2 id="Stochastic-Policies"><a class="docs-heading-anchor" href="#Stochastic-Policies">Stochastic Policies</a><a id="Stochastic-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Stochastic-Policies" title="Permalink"></a></h2><p>Types for representing randomized policies:</p><ul><li><code>StochasticPolicy</code> samples actions from an arbitrary distribution.</li><li><code>UniformRandomPolicy</code> samples actions uniformly (see <code>RandomPolicy</code> for a similar use)</li><li><code>CategoricalTabularPolicy</code> samples actions from a categorical distribution with weights given by a <code>ValuePolicy</code>.</li></ul><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a 
class="docstring-binding" id="POMDPTools.Policies.StochasticPolicy" href="#POMDPTools.Policies.StochasticPolicy"><code>POMDPTools.Policies.StochasticPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><p>StochasticPolicy{D, RNG &lt;: AbstractRNG}</p><p>Represents a stochastic policy. Action are sampled from an arbitrary distribution.</p><p>Constructor:</p><pre><code class="nohighlight hljs">`StochasticPolicy(distribution; rng=Random.default_rng())`</code></pre><p><strong>Fields</strong></p><ul><li><code>distribution::D</code></li><li><code>rng::RNG</code> a random number generator</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/stochastic.jl#L4-L16">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.CategoricalTabularPolicy" href="#POMDPTools.Policies.CategoricalTabularPolicy"><code>POMDPTools.Policies.CategoricalTabularPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">CategoricalTabularPolicy</code></pre><p>represents a stochastic policy sampling an action from a categorical distribution with weights given by a <code>ValuePolicy</code></p><p>constructor:</p><p><code>CategoricalTabularPolicy(mdp::Union{POMDP,MDP}; rng=Random.default_rng())</code></p><p><strong>Fields</strong></p><ul><li><code>stochastic::StochasticPolicy</code></li><li><code>value::ValuePolicy</code></li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/stochastic.jl#L35-L47">source</a></section></article><h2 id="Vector-Policies"><a 
class="docs-heading-anchor" href="#Vector-Policies">Vector Policies</a><a id="Vector-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Vector-Policies" title="Permalink"></a></h2><p>Tabular policies including the following:</p><ul><li><code>VectorPolicy</code> holds a vector of actions, one for each state, ordered according to <a href="../../api/#POMDPs.stateindex"><code>stateindex</code></a>.</li><li><code>ValuePolicy</code> holds a matrix of values for state-action pairs and chooses the action with the highest value at the given state</li></ul><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.VectorPolicy" href="#POMDPTools.Policies.VectorPolicy"><code>POMDPTools.Policies.VectorPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">VectorPolicy{S,A}</code></pre><p>A generic MDP policy that consists of a vector of actions. 
The entry at <code>stateindex(mdp, s)</code> is the action that will be taken in state <code>s</code>.</p><p><strong>Fields</strong></p><ul><li><code>mdp::MDP{S,A}</code> the MDP problem</li><li><code>act::Vector{A}</code> a vector of size |S| mapping state indices to actions</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/vector.jl#L4-L11">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.VectorSolver" href="#POMDPTools.Policies.VectorSolver"><code>POMDPTools.Policies.VectorSolver</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">VectorSolver{A}</code></pre><p>Solver for VectorPolicy. Doesn&#39;t do any computation - just sets the action vector.</p><p><strong>Fields</strong></p><ul><li><code>act::Vector{A}</code> the action vector</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/vector.jl#L19-L25">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.ValuePolicy" href="#POMDPTools.Policies.ValuePolicy"><code>POMDPTools.Policies.ValuePolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs"> ValuePolicy{P&lt;:Union{POMDP,MDP}, T&lt;:AbstractMatrix{Float64}, A}</code></pre><p>A generic MDP policy that consists of a value table. 
The entry at <code>stateindex(mdp, s)</code> is the action that will be taken in state <code>s</code>. It is expected that the order of the actions in the value table is consistent with the order of the actions in <code>act</code>.  If <code>act</code> is not explicitly set in the construction, <code>act</code> is ordered according to <code>actionindex</code>.</p><p><strong>Fields</strong></p><ul><li><code>mdp::P</code> the MDP problem</li><li><code>value_table::T</code> the value table as a |S|x|A| matrix</li><li><code>act::Vector{A}</code> the possible actions</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/vector.jl#L42-L52">source</a></section></article><h2 id="Value-Dict-Policy"><a class="docs-heading-anchor" href="#Value-Dict-Policy">Value Dict Policy</a><a id="Value-Dict-Policy-1"></a><a class="docs-heading-anchor-permalink" href="#Value-Dict-Policy" title="Permalink"></a></h2><p><code>ValueDictPolicy</code> holds a dictionary of values, where the key is state-action tuple, and chooses the action with the highest value at the given state. It allows one to write solvers without enumerating state and action spaces, but actions and states must support <code>Base.isequal()</code> and <code>Base.hash()</code>.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.ValueDictPolicy" href="#POMDPTools.Policies.ValueDictPolicy"><code>POMDPTools.Policies.ValueDictPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs"> ValueDictPolicy(mdp)</code></pre><p>A generic MDP policy that consists of a <code>Dict</code> storing Q-values for state-action pairs. 
If there are no entries higher than a default value, this will fall back to a default policy.</p><p><strong>Keyword Arguments</strong></p><ul><li><code>value_table::AbstractDict</code> the value dict, key is (s, a) Tuple.</li><li><code>default_value::Float64</code> the defalut value of <code>value_dict</code>.</li><li><code>default_policy::Policy</code> the policy taken when no action has a value higher than <code>default_value</code></li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/dict.jl#L1-L10">source</a></section></article><h2 id="Exploration-Policies"><a class="docs-heading-anchor" href="#Exploration-Policies">Exploration Policies</a><a id="Exploration-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Exploration-Policies" title="Permalink"></a></h2><p>Exploration policies are often useful for Reinforcement Learning algorithm to choose an action that is different than the action given by the policy being learned (<code>on_policy</code>). </p><p>Exploration policies are subtype of the abstract <code>ExplorationPolicy</code> type and they follow the following interface:  <code>action(exploration_policy::ExplorationPolicy, on_policy::Policy, k, s)</code>. <code>k</code> is used to compute the value of the exploration parameter (see <a href="#Schedule">Schedule</a>), and <code>s</code> is the current state or observation in which the agent is taking an action.</p><p>The <code>action</code> method is exported by <a href="https://github.com/JuliaPOMDP/POMDPs.jl">POMDPs.jl</a>.  To use exploration policies in a solver, you must use the four argument version of <code>action</code> where <code>on_policy</code> is the policy being learned (e.g. 
tabular policy or neural network policy).</p><p>This package provides two exploration policies: <code>EpsGreedyPolicy</code> and <code>SoftmaxPolicy</code></p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.EpsGreedyPolicy" href="#POMDPTools.Policies.EpsGreedyPolicy"><code>POMDPTools.Policies.EpsGreedyPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">EpsGreedyPolicy &lt;: ExplorationPolicy</code></pre><p>represents an epsilon greedy policy, sampling a random action with a probability <code>eps</code> or returning an action from a given policy otherwise. The evolution of epsilon can be controlled using a schedule. This feature is useful for using those policies in reinforcement learning algorithms. </p><p><strong>Constructor:</strong></p><p><code>EpsGreedyPolicy(problem::Union{MDP, POMDP}, eps::Union{Function, Float64}; rng=Random.default_rng(), schedule=ConstantSchedule)</code></p><p>If a function is passed for <code>eps</code>, <code>eps(k)</code> is called to compute the value of epsilon when calling <code>action(exploration_policy, on_policy, k, s)</code>.</p><p><strong>Fields</strong></p><ul><li><code>eps::Function</code></li><li><code>rng::AbstractRNG</code></li><li><code>m::M</code> POMDPs or MDPs problem</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/exploration_policies.jl#L38-L56">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.SoftmaxPolicy" 
href="#POMDPTools.Policies.SoftmaxPolicy"><code>POMDPTools.Policies.SoftmaxPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">SoftmaxPolicy &lt;: ExplorationPolicy</code></pre><p>represents a softmax policy, sampling a random action according to a softmax function.  The softmax function converts the action values of the on policy into probabilities that are used for sampling.  A temperature parameter or function can be used to make the resulting distribution more or less wide.</p><p><strong>Constructor</strong></p><p><code>SoftmaxPolicy(problem, temperature::Union{Function, Float64}; rng=Random.default_rng())</code></p><p>If a function is passed for <code>temperature</code>, <code>temperature(k)</code> is called to compute the value of the temperature when calling <code>action(exploration_policy, on_policy, k, s)</code></p><p><strong>Fields</strong></p><ul><li><code>temperature::Function</code></li><li><code>rng::AbstractRNG</code></li><li><code>actions::A</code> an indexable list of action</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/exploration_policies.jl#L84-L103">source</a></section></article><h3 id="Schedule"><a class="docs-heading-anchor" href="#Schedule">Schedule</a><a id="Schedule-1"></a><a class="docs-heading-anchor-permalink" href="#Schedule" title="Permalink"></a></h3><p>Exploration policies often rely on a key parameter: <span>$\epsilon$</span> in <span>$\epsilon$</span>-greedy and the temperature in softmax for example.  Reinforcement learning algorithms often require a decay schedule for these parameters.  Schedule can be passed to an exploration policy as functions. For example one can define an epsilon greedy policy with an exponential decay schedule as follow: </p><pre><code class="language-julia hljs">    m # your mdp or pomdp model
-    exploration_policy = EpsGreedyPolicy(m, k-&gt;0.05*0.9^(k/10))</code></pre><p><code>POMDPTools</code> exports a linear decay schedule object that can be used as well.  </p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.LinearDecaySchedule" href="#POMDPTools.Policies.LinearDecaySchedule"><code>POMDPTools.Policies.LinearDecaySchedule</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">LinearDecaySchedule</code></pre><p>A schedule that linearly decreases a value from <code>start</code> to <code>stop</code> in <code>steps</code> steps. if the value is greater or equal to <code>stop</code>, it stays constant.</p><p><strong>Constructor</strong></p><p><code>LinearDecaySchedule(;start, stop, steps)</code></p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/exploration_policies.jl#L1-L9">source</a></section></article><h2 id="Playback-Policy"><a class="docs-heading-anchor" href="#Playback-Policy">Playback Policy</a><a id="Playback-Policy-1"></a><a class="docs-heading-anchor-permalink" href="#Playback-Policy" title="Permalink"></a></h2><p>A policy that replays a fixed sequence of actions. 
When all actions are used, a backup policy is used.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.PlaybackPolicy" href="#POMDPTools.Policies.PlaybackPolicy"><code>POMDPTools.Policies.PlaybackPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">PlaybackPolicy{A&lt;:AbstractArray, P&lt;:Policy, V&lt;:AbstractArray{&lt;:Real}}</code></pre><p>a policy that applies a fixed sequence of actions until they are all used and then falls back onto a backup policy until the end of the episode.</p><p>Constructor:</p><pre><code class="nohighlight hljs">`PlaybackPolicy(actions::AbstractArray, backup_policy::Policy; logpdfs::AbstractArray{Float64, 1} = Float64[])`</code></pre><p><strong>Fields</strong></p><ul><li><code>actions::Vector{A}</code> a vector of actions to play back</li><li><code>backup_policy::Policy</code> the policy to use when all prescribed actions have been taken but the episode continues</li><li><code>logpdfs::Vector{Float64}</code> the log probability (density) of actions</li><li><code>i::Int64</code> the current action index</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/playback.jl#L2-L15">source</a></section></article><h2 id="Utility-Wrapper"><a class="docs-heading-anchor" href="#Utility-Wrapper">Utility Wrapper</a><a id="Utility-Wrapper-1"></a><a class="docs-heading-anchor-permalink" href="#Utility-Wrapper" title="Permalink"></a></h2><p>A wrapper for policies to collect statistics and handle errors.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" 
id="POMDPTools.Policies.PolicyWrapper" href="#POMDPTools.Policies.PolicyWrapper"><code>POMDPTools.Policies.PolicyWrapper</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">PolicyWrapper</code></pre><p>Flexible utility wrapper for a policy designed for collecting statistics about planning.</p><p>Carries a function, a policy, and optionally a payload (that can be any type).</p><p>The function should typically be defined with the do syntax. Each time <code>action</code> is called on the wrapper, this function will be called.</p><p>If there is no payload, it will be called with two argments: the policy and the state/belief. If there is a payload, it will be called with three arguments: the policy, the payload, and the current state or belief. The function should return an appropriate action. The idea is that, in this function, <code>action(policy, s)</code> should be called, statistics from the policy/planner should be collected and saved in the payload, exceptions can be handled, and the action should be returned.</p><p>Constructor</p><p><code>PolicyWrapper(policy::Policy; payload=nothing)</code></p><p><strong>Example</strong></p><pre><code class="language-julia hljs">using POMDPModels
+         updater=NothingUpdater())`</code></pre><p><strong>Fields</strong></p><ul><li><code>rng::RNG</code> a random number generator </li><li><code>problem::P</code> the POMDP or MDP problem </li><li><code>updater::U</code> a belief updater (default to <code>NothingUpdater</code> in the above constructor)</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/random.jl#L3-L17">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.RandomSolver" href="#POMDPTools.Policies.RandomSolver"><code>POMDPTools.Policies.RandomSolver</code></a> — <span class="docstring-category">Type</span></header><section><div><p>solver that produces a random policy</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/random.jl#L40-L42">source</a></section></article><h2 id="Stochastic-Policies"><a class="docs-heading-anchor" href="#Stochastic-Policies">Stochastic Policies</a><a id="Stochastic-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Stochastic-Policies" title="Permalink"></a></h2><p>Types for representing randomized policies:</p><ul><li><code>StochasticPolicy</code> samples actions from an arbitrary distribution.</li><li><code>UniformRandomPolicy</code> samples actions uniformly (see <code>RandomPolicy</code> for a similar use)</li><li><code>CategoricalTabularPolicy</code> samples actions from a categorical distribution with weights given by a <code>ValuePolicy</code>.</li></ul><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a 
class="docstring-binding" id="POMDPTools.Policies.StochasticPolicy" href="#POMDPTools.Policies.StochasticPolicy"><code>POMDPTools.Policies.StochasticPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><p>StochasticPolicy{D, RNG &lt;: AbstractRNG}</p><p>Represents a stochastic policy. Actions are sampled from an arbitrary distribution.</p><p>Constructor:</p><pre><code class="nohighlight hljs">`StochasticPolicy(distribution; rng=Random.default_rng())`</code></pre><p><strong>Fields</strong></p><ul><li><code>distribution::D</code></li><li><code>rng::RNG</code> a random number generator</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/stochastic.jl#L4-L16">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.CategoricalTabularPolicy" href="#POMDPTools.Policies.CategoricalTabularPolicy"><code>POMDPTools.Policies.CategoricalTabularPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">CategoricalTabularPolicy</code></pre><p>represents a stochastic policy sampling an action from a categorical distribution with weights given by a <code>ValuePolicy</code></p><p>constructor:</p><p><code>CategoricalTabularPolicy(mdp::Union{POMDP,MDP}; rng=Random.default_rng())</code></p><p><strong>Fields</strong></p><ul><li><code>stochastic::StochasticPolicy</code></li><li><code>value::ValuePolicy</code></li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/stochastic.jl#L35-L47">source</a></section></article><h2 id="Vector-Policies"><a 
class="docs-heading-anchor" href="#Vector-Policies">Vector Policies</a><a id="Vector-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Vector-Policies" title="Permalink"></a></h2><p>Tabular policies including the following:</p><ul><li><code>VectorPolicy</code> holds a vector of actions, one for each state, ordered according to <a href="../../api/#POMDPs.stateindex"><code>stateindex</code></a>.</li><li><code>ValuePolicy</code> holds a matrix of values for state-action pairs and chooses the action with the highest value at the given state</li></ul><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.VectorPolicy" href="#POMDPTools.Policies.VectorPolicy"><code>POMDPTools.Policies.VectorPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">VectorPolicy{S,A}</code></pre><p>A generic MDP policy that consists of a vector of actions. 
The entry at <code>stateindex(mdp, s)</code> is the action that will be taken in state <code>s</code>.</p><p><strong>Fields</strong></p><ul><li><code>mdp::MDP{S,A}</code> the MDP problem</li><li><code>act::Vector{A}</code> a vector of size |S| mapping state indices to actions</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/vector.jl#L4-L11">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.VectorSolver" href="#POMDPTools.Policies.VectorSolver"><code>POMDPTools.Policies.VectorSolver</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">VectorSolver{A}</code></pre><p>Solver for VectorPolicy. Doesn&#39;t do any computation - just sets the action vector.</p><p><strong>Fields</strong></p><ul><li><code>act::Vector{A}</code> the action vector</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/vector.jl#L19-L25">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.ValuePolicy" href="#POMDPTools.Policies.ValuePolicy"><code>POMDPTools.Policies.ValuePolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs"> ValuePolicy{P&lt;:Union{POMDP,MDP}, T&lt;:AbstractMatrix{Float64}, A}</code></pre><p>A generic MDP policy that consists of a value table. 
The entry at <code>stateindex(mdp, s)</code> is the action that will be taken in state <code>s</code>. It is expected that the order of the actions in the value table is consistent with the order of the actions in <code>act</code>.  If <code>act</code> is not explicitly set in the construction, <code>act</code> is ordered according to <code>actionindex</code>.</p><p><strong>Fields</strong></p><ul><li><code>mdp::P</code> the MDP problem</li><li><code>value_table::T</code> the value table as a |S|x|A| matrix</li><li><code>act::Vector{A}</code> the possible actions</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/vector.jl#L42-L52">source</a></section></article><h2 id="Value-Dict-Policy"><a class="docs-heading-anchor" href="#Value-Dict-Policy">Value Dict Policy</a><a id="Value-Dict-Policy-1"></a><a class="docs-heading-anchor-permalink" href="#Value-Dict-Policy" title="Permalink"></a></h2><p><code>ValueDictPolicy</code> holds a dictionary of values, where the key is state-action tuple, and chooses the action with the highest value at the given state. It allows one to write solvers without enumerating state and action spaces, but actions and states must support <code>Base.isequal()</code> and <code>Base.hash()</code>.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.ValueDictPolicy" href="#POMDPTools.Policies.ValueDictPolicy"><code>POMDPTools.Policies.ValueDictPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs"> ValueDictPolicy(mdp)</code></pre><p>A generic MDP policy that consists of a <code>Dict</code> storing Q-values for state-action pairs. 
If there are no entries higher than a default value, this will fall back to a default policy.</p><p><strong>Keyword Arguments</strong></p><ul><li><code>value_table::AbstractDict</code> the value dict, key is (s, a) Tuple.</li><li><code>default_value::Float64</code> the default value of <code>value_dict</code>.</li><li><code>default_policy::Policy</code> the policy taken when no action has a value higher than <code>default_value</code></li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/dict.jl#L1-L10">source</a></section></article><h2 id="Exploration-Policies"><a class="docs-heading-anchor" href="#Exploration-Policies">Exploration Policies</a><a id="Exploration-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Exploration-Policies" title="Permalink"></a></h2><p>Exploration policies are often useful for Reinforcement Learning algorithms to choose an action that is different than the action given by the policy being learned (<code>on_policy</code>). </p><p>Exploration policies are subtypes of the abstract <code>ExplorationPolicy</code> type and they follow the following interface:  <code>action(exploration_policy::ExplorationPolicy, on_policy::Policy, k, s)</code>. <code>k</code> is used to compute the value of the exploration parameter (see <a href="#Schedule">Schedule</a>), and <code>s</code> is the current state or observation in which the agent is taking an action.</p><p>The <code>action</code> method is exported by <a href="https://github.com/JuliaPOMDP/POMDPs.jl">POMDPs.jl</a>.  To use exploration policies in a solver, you must use the four argument version of <code>action</code> where <code>on_policy</code> is the policy being learned (e.g. 
tabular policy or neural network policy).</p><p>This package provides two exploration policies: <code>EpsGreedyPolicy</code> and <code>SoftmaxPolicy</code></p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.EpsGreedyPolicy" href="#POMDPTools.Policies.EpsGreedyPolicy"><code>POMDPTools.Policies.EpsGreedyPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">EpsGreedyPolicy &lt;: ExplorationPolicy</code></pre><p>represents an epsilon greedy policy, sampling a random action with a probability <code>eps</code> or returning an action from a given policy otherwise. The evolution of epsilon can be controlled using a schedule. This feature is useful for using those policies in reinforcement learning algorithms. </p><p><strong>Constructor:</strong></p><p><code>EpsGreedyPolicy(problem::Union{MDP, POMDP}, eps::Union{Function, Float64}; rng=Random.default_rng(), schedule=ConstantSchedule)</code></p><p>If a function is passed for <code>eps</code>, <code>eps(k)</code> is called to compute the value of epsilon when calling <code>action(exploration_policy, on_policy, k, s)</code>.</p><p><strong>Fields</strong></p><ul><li><code>eps::Function</code></li><li><code>rng::AbstractRNG</code></li><li><code>m::M</code> POMDPs or MDPs problem</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/exploration_policies.jl#L38-L56">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.SoftmaxPolicy" 
href="#POMDPTools.Policies.SoftmaxPolicy"><code>POMDPTools.Policies.SoftmaxPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">SoftmaxPolicy &lt;: ExplorationPolicy</code></pre><p>represents a softmax policy, sampling a random action according to a softmax function.  The softmax function converts the action values of the on policy into probabilities that are used for sampling.  A temperature parameter or function can be used to make the resulting distribution more or less wide.</p><p><strong>Constructor</strong></p><p><code>SoftmaxPolicy(problem, temperature::Union{Function, Float64}; rng=Random.default_rng())</code></p><p>If a function is passed for <code>temperature</code>, <code>temperature(k)</code> is called to compute the value of the temperature when calling <code>action(exploration_policy, on_policy, k, s)</code></p><p><strong>Fields</strong></p><ul><li><code>temperature::Function</code></li><li><code>rng::AbstractRNG</code></li><li><code>actions::A</code> an indexable list of action</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/exploration_policies.jl#L84-L103">source</a></section></article><h3 id="Schedule"><a class="docs-heading-anchor" href="#Schedule">Schedule</a><a id="Schedule-1"></a><a class="docs-heading-anchor-permalink" href="#Schedule" title="Permalink"></a></h3><p>Exploration policies often rely on a key parameter: <span>$\epsilon$</span> in <span>$\epsilon$</span>-greedy and the temperature in softmax for example.  Reinforcement learning algorithms often require a decay schedule for these parameters.  Schedule can be passed to an exploration policy as functions. For example one can define an epsilon greedy policy with an exponential decay schedule as follow: </p><pre><code class="language-julia hljs">    m # your mdp or pomdp model
+    exploration_policy = EpsGreedyPolicy(m, k-&gt;0.05*0.9^(k/10))</code></pre><p><code>POMDPTools</code> exports a linear decay schedule object that can be used as well.  </p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.LinearDecaySchedule" href="#POMDPTools.Policies.LinearDecaySchedule"><code>POMDPTools.Policies.LinearDecaySchedule</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">LinearDecaySchedule</code></pre><p>A schedule that linearly decreases a value from <code>start</code> to <code>stop</code> in <code>steps</code> steps. if the value is greater or equal to <code>stop</code>, it stays constant.</p><p><strong>Constructor</strong></p><p><code>LinearDecaySchedule(;start, stop, steps)</code></p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/exploration_policies.jl#L1-L9">source</a></section></article><h2 id="Playback-Policy"><a class="docs-heading-anchor" href="#Playback-Policy">Playback Policy</a><a id="Playback-Policy-1"></a><a class="docs-heading-anchor-permalink" href="#Playback-Policy" title="Permalink"></a></h2><p>A policy that replays a fixed sequence of actions. 
When all actions are used, a backup policy is used.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.PlaybackPolicy" href="#POMDPTools.Policies.PlaybackPolicy"><code>POMDPTools.Policies.PlaybackPolicy</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">PlaybackPolicy{A&lt;:AbstractArray, P&lt;:Policy, V&lt;:AbstractArray{&lt;:Real}}</code></pre><p>a policy that applies a fixed sequence of actions until they are all used and then falls back onto a backup policy until the end of the episode.</p><p>Constructor:</p><pre><code class="nohighlight hljs">`PlaybackPolicy(actions::AbstractArray, backup_policy::Policy; logpdfs::AbstractArray{Float64, 1} = Float64[])`</code></pre><p><strong>Fields</strong></p><ul><li><code>actions::Vector{A}</code> a vector of actions to play back</li><li><code>backup_policy::Policy</code> the policy to use when all prescribed actions have been taken but the episode continues</li><li><code>logpdfs::Vector{Float64}</code> the log probability (density) of actions</li><li><code>i::Int64</code> the current action index</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/playback.jl#L2-L15">source</a></section></article><h2 id="Utility-Wrapper"><a class="docs-heading-anchor" href="#Utility-Wrapper">Utility Wrapper</a><a id="Utility-Wrapper-1"></a><a class="docs-heading-anchor-permalink" href="#Utility-Wrapper" title="Permalink"></a></h2><p>A wrapper for policies to collect statistics and handle errors.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" 
id="POMDPTools.Policies.PolicyWrapper" href="#POMDPTools.Policies.PolicyWrapper"><code>POMDPTools.Policies.PolicyWrapper</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">PolicyWrapper</code></pre><p>Flexible utility wrapper for a policy designed for collecting statistics about planning.</p><p>Carries a function, a policy, and optionally a payload (that can be any type).</p><p>The function should typically be defined with the do syntax. Each time <code>action</code> is called on the wrapper, this function will be called.</p><p>If there is no payload, it will be called with two arguments: the policy and the state/belief. If there is a payload, it will be called with three arguments: the policy, the payload, and the current state or belief. The function should return an appropriate action. The idea is that, in this function, <code>action(policy, s)</code> should be called, statistics from the policy/planner should be collected and saved in the payload, exceptions can be handled, and the action should be returned.</p><p>Constructor</p><p><code>PolicyWrapper(policy::Policy; payload=nothing)</code></p><p><strong>Example</strong></p><pre><code class="language-julia hljs">using POMDPModels
 using POMDPToolbox
 
 mdp = GridWorld()
@@ -32,10 +32,10 @@
     return a
 end
 
-h = simulate(HistoryRecorder(max_steps=100), mdp, errwrapper)</code></pre><p><strong>Fields</strong></p><ul><li><code>f::F</code></li><li><code>policy::P</code></li><li><code>payload::PL</code></li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/utility_wrapper.jl#L1-L56">source</a></section></article><h2 id="Pretty-Printing-Policies"><a class="docs-heading-anchor" href="#Pretty-Printing-Policies">Pretty Printing Policies</a><a id="Pretty-Printing-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Pretty-Printing-Policies" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.showpolicy" href="#POMDPTools.Policies.showpolicy"><code>POMDPTools.Policies.showpolicy</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">showpolicy([io], [mime], m::MDP, p::Policy)
+h = simulate(HistoryRecorder(max_steps=100), mdp, errwrapper)</code></pre><p><strong>Fields</strong></p><ul><li><code>f::F</code></li><li><code>policy::P</code></li><li><code>payload::PL</code></li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/utility_wrapper.jl#L1-L56">source</a></section></article><h2 id="Pretty-Printing-Policies"><a class="docs-heading-anchor" href="#Pretty-Printing-Policies">Pretty Printing Policies</a><a id="Pretty-Printing-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Pretty-Printing-Policies" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.showpolicy" href="#POMDPTools.Policies.showpolicy"><code>POMDPTools.Policies.showpolicy</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">showpolicy([io], [mime], m::MDP, p::Policy)
 showpolicy([io], [mime], statelist::AbstractVector, p::Policy)
-showpolicy(...; pre=&quot; &quot;)</code></pre><p>Print the states in <code>m</code> or <code>statelist</code> and the actions from policy <code>p</code> corresponding to those states.</p><p>For the MDP version, if <code>io[:limit]</code> is <code>true</code>, will only print enough states to fill the display.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/pretty_printing.jl#L1-L9">source</a></section></article><h1 id="Policy-Evaluation"><a class="docs-heading-anchor" href="#Policy-Evaluation">Policy Evaluation</a><a id="Policy-Evaluation-1"></a><a class="docs-heading-anchor-permalink" href="#Policy-Evaluation" title="Permalink"></a></h1><p>The <a href="#POMDPTools.Policies.evaluate"><code>evaluate</code></a> function provides a policy evaluation tool for MDPs:</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.evaluate" href="#POMDPTools.Policies.evaluate"><code>POMDPTools.Policies.evaluate</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">evaluate(m::MDP, p::Policy)
+showpolicy(...; pre=&quot; &quot;)</code></pre><p>Print the states in <code>m</code> or <code>statelist</code> and the actions from policy <code>p</code> corresponding to those states.</p><p>For the MDP version, if <code>io[:limit]</code> is <code>true</code>, will only print enough states to fill the display.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/pretty_printing.jl#L1-L9">source</a></section></article><h1 id="Policy-Evaluation"><a class="docs-heading-anchor" href="#Policy-Evaluation">Policy Evaluation</a><a id="Policy-Evaluation-1"></a><a class="docs-heading-anchor-permalink" href="#Policy-Evaluation" title="Permalink"></a></h1><p>The <a href="#POMDPTools.Policies.evaluate"><code>evaluate</code></a> function provides a policy evaluation tool for MDPs:</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Policies.evaluate" href="#POMDPTools.Policies.evaluate"><code>POMDPTools.Policies.evaluate</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">evaluate(m::MDP, p::Policy)
 evaluate(m::MDP, p::Policy; rewardfunction=POMDPs.reward)</code></pre><p>Calculate the value for a policy on an MDP using the approach in equation 4.2.2 of Kochenderfer, <em>Decision Making Under Uncertainty</em>, 2015.</p><p>Returns a DiscreteValueFunction, which maps states to values.</p><p><strong>Example</strong></p><pre><code class="nohighlight hljs">using POMDPTools, POMDPModels
 m = SimpleGridWorld()
 u = evaluate(m, FunctionPolicy(x-&gt;:left))
-u([1,1]) # value of always moving left starting at state [1,1]</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Policies/policy_evaluation.jl#L13-L28">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../beliefs/">« Implemented Belief Updaters</a><a class="docs-footer-nextpage" href="../simulators/">Implemented Simulators »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+u([1,1]) # value of always moving left starting at state [1,1]</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Policies/policy_evaluation.jl#L13-L28">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../beliefs/">« Implemented Belief Updaters</a><a class="docs-footer-nextpage" href="../simulators/">Implemented Simulators »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/POMDPTools/simulators/index.html b/dev/POMDPTools/simulators/index.html
index 13fb9054..24902db1 100644
--- a/dev/POMDPTools/simulators/index.html
+++ b/dev/POMDPTools/simulators/index.html
@@ -16,7 +16,7 @@
     println(&quot;in state $s&quot;)
     println(&quot;took action $a&quot;)
     println(&quot;received observation $o and reward $r&quot;)
-end</code></pre><p>The optional <code>spec</code> argument can be a string, tuple of symbols, or single symbol and follows the same pattern as <a href="#eachstep"><code>eachstep</code></a> called on a <code>SimHistory</code> object.</p><p>Under the hood, this function creates a <code>StepSimulator</code> with <code>spec</code> and returns a <code>[PO]MDPSimIterator</code> by calling simulate with all of the arguments except <code>spec</code>. All keyword arguments are passed to the <code>StepSimulator</code> constructor.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Simulators/stepthrough.jl#L158-L180">source</a></section></article><p>The <code>StepSimulator</code> contained in this file can provide the same functionality with the following syntax:</p><pre><code class="language-julia hljs">sim = StepSimulator(&quot;s,a,r,sp&quot;)
+end</code></pre><p>The optional <code>spec</code> argument can be a string, tuple of symbols, or single symbol and follows the same pattern as <a href="#eachstep"><code>eachstep</code></a> called on a <code>SimHistory</code> object.</p><p>Under the hood, this function creates a <code>StepSimulator</code> with <code>spec</code> and returns a <code>[PO]MDPSimIterator</code> by calling simulate with all of the arguments except <code>spec</code>. All keyword arguments are passed to the <code>StepSimulator</code> constructor.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Simulators/stepthrough.jl#L158-L180">source</a></section></article><p>The <code>StepSimulator</code> contained in this file can provide the same functionality with the following syntax:</p><pre><code class="language-julia hljs">sim = StepSimulator(&quot;s,a,r,sp&quot;)
 for (s,a,r,sp) in simulate(sim, problem, policy)
     # do something
 end</code></pre><h2 id="Rollouts"><a class="docs-heading-anchor" href="#Rollouts">Rollouts</a><a id="Rollouts-1"></a><a class="docs-heading-anchor-permalink" href="#Rollouts" title="Permalink"></a></h2><p><code>RolloutSimulator</code> is the simplest MDP or POMDP simulator. When <code>simulate</code> is called, it simply simulates a single trajectory of the process and returns the discounted reward.</p><pre><code class="language-julia hljs">rs = RolloutSimulator()
@@ -25,12 +25,12 @@
 
 r = simulate(rs, mdp, policy)</code></pre><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Simulators.RolloutSimulator" href="#POMDPTools.Simulators.RolloutSimulator"><code>POMDPTools.Simulators.RolloutSimulator</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">RolloutSimulator(rng, max_steps)
 RolloutSimulator(; &lt;keyword arguments&gt;)</code></pre><p>A fast simulator that just returns the reward</p><p>The simulation will be terminated when either</p><ol><li>a terminal state is reached (as determined by <code>isterminal()</code> or</li><li>the discount factor is as small as <code>eps</code> or</li><li>max_steps have been executed</li></ol><p><strong>Keyword arguments:</strong></p><ul><li>rng::AbstractRNG (default: Random.default_rng()) - A random number generator to use. </li><li>eps::Float64 (default: 0.0) - A small number; if γᵗ where γ is the discount factor and t is the time step becomes smaller than this, the simulation will be terminated.</li><li>max_steps::Int (default: typemax(Int)) - The maximum number of steps to simulate.</li></ul><p><strong>Usage (optional arguments in brackets):</strong></p><pre><code class="nohighlight hljs">ro = RolloutSimulator()
-history = simulate(ro, pomdp, policy, [updater [, init_belief [, init_state]]])</code></pre><p>See also: <a href="#POMDPTools.Simulators.HistoryRecorder"><code>HistoryRecorder</code></a>, <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a></p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Simulators/rollout.jl#L4-L26">source</a></section></article><h2 id="History-Recorder"><a class="docs-heading-anchor" href="#History-Recorder">History Recorder</a><a id="History-Recorder-1"></a><a class="docs-heading-anchor-permalink" href="#History-Recorder" title="Permalink"></a></h2><p>A <code>HistoryRecorder</code> runs a simulation and records the trajectory. It returns an <code>AbstractVector</code> of <code>NamedTuples</code> - see <a href="#Histories">Histories</a> for more info.</p><pre><code class="language-julia hljs">hr = HistoryRecorder(max_steps=100)
+history = simulate(ro, pomdp, policy, [updater [, init_belief [, init_state]]])</code></pre><p>See also: <a href="#POMDPTools.Simulators.HistoryRecorder"><code>HistoryRecorder</code></a>, <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a></p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Simulators/rollout.jl#L4-L26">source</a></section></article><h2 id="History-Recorder"><a class="docs-heading-anchor" href="#History-Recorder">History Recorder</a><a id="History-Recorder-1"></a><a class="docs-heading-anchor-permalink" href="#History-Recorder" title="Permalink"></a></h2><p>A <code>HistoryRecorder</code> runs a simulation and records the trajectory. It returns an <code>AbstractVector</code> of <code>NamedTuples</code> - see <a href="#Histories">Histories</a> for more info.</p><pre><code class="language-julia hljs">hr = HistoryRecorder(max_steps=100)
 pomdp = TigerPOMDP()
 policy = RandomPolicy(pomdp)
 
 h = simulate(hr, pomdp, policy)</code></pre><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Simulators.HistoryRecorder" href="#POMDPTools.Simulators.HistoryRecorder"><code>POMDPTools.Simulators.HistoryRecorder</code></a> — <span class="docstring-category">Type</span></header><section><div><p>A simulator that records the history for later examination</p><p>The simulation will be terminated when either</p><ol><li>a terminal state is reached (as determined by <code>isterminal()</code> or</li><li>the discount factor is as small as <code>eps</code> or</li><li>max_steps have been executed</li></ol><p>Keyword Arguments:     - <code>rng</code>: The random number generator for the simulation     - <code>capture_exception::Bool</code>: whether to capture an exception and store it in the history, or let it go uncaught, potentially killing the script     - <code>show_progress::Bool</code>: show a progress bar for the simulation     - <code>eps</code>     - <code>max_steps</code></p><p>Usage (optional arguments in brackets):</p><pre><code class="nohighlight hljs">hr = HistoryRecorder()
-history = simulate(hr, pomdp, policy, [updater [, init_belief [, init_state]]])</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Simulators/history_recorder.jl#L4-L23">source</a></section></article><h2 id="sim-function"><a class="docs-heading-anchor" href="#sim-function"><code>sim()</code></a><a id="sim-function-1"></a><a class="docs-heading-anchor-permalink" href="#sim-function" title="Permalink"></a></h2><p>The <code>sim</code> function provides a convenient way to interact with a POMDP or MDP environment and return a <a href="#Histories">history</a>. The first argument is a function that is called at every time step and takes a state (in the case of an MDP) or an observation (in the case of a POMDP) as the argument and then returns an action. The second argument is a pomdp or mdp. It is intended to be used with Julia&#39;s <a href="https://docs.julialang.org/en/v1/manual/functions/#Do-Block-Syntax-for-Function-Arguments-1"><code>do</code> syntax</a> as follows:</p><pre><code class="language-julia hljs">pomdp = TigerPOMDP()
+history = simulate(hr, pomdp, policy, [updater [, init_belief [, init_state]]])</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Simulators/history_recorder.jl#L4-L23">source</a></section></article><h2 id="sim-function"><a class="docs-heading-anchor" href="#sim-function"><code>sim()</code></a><a id="sim-function-1"></a><a class="docs-heading-anchor-permalink" href="#sim-function" title="Permalink"></a></h2><p>The <code>sim</code> function provides a convenient way to interact with a POMDP or MDP environment and return a <a href="#Histories">history</a>. The first argument is a function that is called at every time step and takes a state (in the case of an MDP) or an observation (in the case of a POMDP) as the argument and then returns an action. The second argument is a pomdp or mdp. It is intended to be used with Julia&#39;s <a href="https://docs.julialang.org/en/v1/manual/functions/#Do-Block-Syntax-for-Function-Arguments-1"><code>do</code> syntax</a> as follows:</p><pre><code class="language-julia hljs">pomdp = TigerPOMDP()
 history = sim(pomdp, max_steps=10) do obs
     println(&quot;Observation was $obs.&quot;)
     return TIGER_OPEN_LEFT
@@ -49,7 +49,7 @@
     return a
 end</code></pre><p>for a POMDP and a belief updater.</p><p><strong>Keyword Arguments</strong></p><p><strong>All Versions</strong></p><ul><li><code>initialstate</code>: the initial state for the simulation</li><li><code>simulator</code>: keyword argument to specify any simulator to run the simulation. If nothing is specified for the simulator, a HistoryRecorder will be used as the simulator, with all keyword arguments forwarded to it, e.g.<pre><code class="nohighlight hljs">sim(mdp, max_steps=100, show_progress=true) do s
     # ...
-end</code></pre>will limit the simulation to 100 steps.</li></ul><p><strong>POMDP version</strong></p><ul><li><code>initialobs</code>: this will control the initial observation given to the policy function. If this is not defined, <code>rand(initialobs(m, s))</code> will be used if it is available. If it is not, <code>missing</code> will be used.</li></ul><p><strong>POMDP and updater version</strong></p><ul><li><code>initialbelief</code>: <code>initialize_belief(updater, initialbelief)</code> is the first belief that will be given to the policy function.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Simulators/sim.jl#L4-L56">source</a></section></article><h2 id="Histories"><a class="docs-heading-anchor" href="#Histories">Histories</a><a id="Histories-1"></a><a class="docs-heading-anchor-permalink" href="#Histories" title="Permalink"></a></h2><p>The results produced by <a href="#POMDPTools.Simulators.HistoryRecorder"><code>HistoryRecorder</code></a>s and the <a href="#POMDPTools.Simulators.sim"><code>sim</code></a> function are contained in <code>SimHistory</code> objects.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Simulators.SimHistory" href="#POMDPTools.Simulators.SimHistory"><code>POMDPTools.Simulators.SimHistory</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">SimHistory</code></pre><p>An (PO)MDP simulation history returned by <code>simulate(::HistoryRecorder, ::Union{MDP,POMDP},...)</code>.</p><p>This is an <code>AbstractVector</code> of <a href="https://docs.julialang.org/en/v1/manual/types/index.html#Named-Tuple-Types-1"><code>NamedTuples</code></a> containing the states, actions, 
etc.</p><p><strong>Examples</strong></p><pre><code class="nohighlight hljs">hist[1][:s] # returns the first state in the history</code></pre><pre><code class="nohighlight hljs">hist[:a] # returns all of the actions in the history</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Simulators/history.jl#L9-L23">source</a></section></article><h3 id="Examples"><a class="docs-heading-anchor" href="#Examples">Examples</a><a id="Examples-1"></a><a class="docs-heading-anchor-permalink" href="#Examples" title="Permalink"></a></h3><pre><code class="language-julia hljs">using POMDPs, POMDPTools, POMDPModels
+end</code></pre>will limit the simulation to 100 steps.</li></ul><p><strong>POMDP version</strong></p><ul><li><code>initialobs</code>: this will control the initial observation given to the policy function. If this is not defined, <code>rand(initialobs(m, s))</code> will be used if it is available. If it is not, <code>missing</code> will be used.</li></ul><p><strong>POMDP and updater version</strong></p><ul><li><code>initialbelief</code>: <code>initialize_belief(updater, initialbelief)</code> is the first belief that will be given to the policy function.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Simulators/sim.jl#L4-L56">source</a></section></article><h2 id="Histories"><a class="docs-heading-anchor" href="#Histories">Histories</a><a id="Histories-1"></a><a class="docs-heading-anchor-permalink" href="#Histories" title="Permalink"></a></h2><p>The results produced by <a href="#POMDPTools.Simulators.HistoryRecorder"><code>HistoryRecorder</code></a>s and the <a href="#POMDPTools.Simulators.sim"><code>sim</code></a> function are contained in <code>SimHistory</code> objects.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Simulators.SimHistory" href="#POMDPTools.Simulators.SimHistory"><code>POMDPTools.Simulators.SimHistory</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">SimHistory</code></pre><p>An (PO)MDP simulation history returned by <code>simulate(::HistoryRecorder, ::Union{MDP,POMDP},...)</code>.</p><p>This is an <code>AbstractVector</code> of <a href="https://docs.julialang.org/en/v1/manual/types/index.html#Named-Tuple-Types-1"><code>NamedTuples</code></a> containing the states, actions, 
etc.</p><p><strong>Examples</strong></p><pre><code class="nohighlight hljs">hist[1][:s] # returns the first state in the history</code></pre><pre><code class="nohighlight hljs">hist[:a] # returns all of the actions in the history</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Simulators/history.jl#L9-L23">source</a></section></article><h3 id="Examples"><a class="docs-heading-anchor" href="#Examples">Examples</a><a id="Examples-1"></a><a class="docs-heading-anchor-permalink" href="#Examples" title="Permalink"></a></h3><pre><code class="language-julia hljs">using POMDPs, POMDPTools, POMDPModels
 hr = HistoryRecorder(max_steps=10)
 hist = simulate(hr, BabyPOMDP(), FunctionPolicy(x-&gt;true))
 step = hist[1] # all information available about the first step
@@ -60,12 +60,12 @@
     println(&quot;reward $r received when state $sp was reached after action $a was taken in state $s&quot;)
 end</code></pre><p>returns the start state, action, reward and destination state for each step of the simulation.</p><p>Alternatively, instead of expanding the steps implicitly, the elements of the step can be accessed as fields (since each step is a <code>NamedTuple</code>):</p><pre><code class="language-julia hljs">for step in eachstep(h, &quot;(s, a, r, sp)&quot;)    
     println(&quot;reward $(step.r) received when state $(step.sp) was reached after action $(step.a) was taken in state $(step.s)&quot;)
-end</code></pre><p>The possible valid elements in the iteration specification are</p><ul><li>Any node in the (PO)MDP Dynamic Decision network (by default <code>:s</code>, <code>:a</code>, <code>:sp</code>, <code>:o</code>, <code>:r</code>)</li><li><code>b</code> - the initial belief in the step (for POMDPs only)</li><li><code>bp</code> - the belief after being updated based on <code>o</code> (for POMDPs only)</li><li><code>action_info</code> - info from the policy decision (from <code>action_info</code>)</li><li><code>update_info</code> - info from the belief update (from <code>update_info</code>)</li><li><code>t</code> - the timestep index</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Simulators/history.jl#L96-L125">source</a></section></article><h4 id="Examples:"><a class="docs-heading-anchor" href="#Examples:">Examples:</a><a id="Examples:-1"></a><a class="docs-heading-anchor-permalink" href="#Examples:" title="Permalink"></a></h4><pre><code class="language-julia hljs">collect(eachstep(h, &quot;a,o&quot;))</code></pre><p>will produce a vector of action-observation named tuples.</p><pre><code class="language-julia hljs">collect(norm(sp-s) for (s,sp) in eachstep(h, &quot;s,sp&quot;))</code></pre><p>will produce a vector of the distances traveled on each step (assuming the state is a Euclidean vector).</p><h4 id="Notes"><a class="docs-heading-anchor" href="#Notes">Notes</a><a id="Notes-1"></a><a class="docs-heading-anchor-permalink" href="#Notes" title="Permalink"></a></h4><ul><li>The iteration specification can be specified as a tuple of symbols (e.g. 
<code>(:s, :a)</code>) instead of a string.</li><li>For type stability in performance-critical code, one should construct an iterator directly using <code>HistoryIterator{typeof(h), (:a,:r)}(h)</code> rather than <code>eachstep(h, &quot;ar&quot;)</code>.</li></ul><h3 id="Other-Functions"><a class="docs-heading-anchor" href="#Other-Functions">Other Functions</a><a id="Other-Functions-1"></a><a class="docs-heading-anchor-permalink" href="#Other-Functions" title="Permalink"></a></h3><p><code>state_hist(h)</code>, <code>action_hist(h)</code>, <code>observation_hist(h)</code> <code>belief_hist(h)</code>, and <code>reward_hist(h)</code> will return vectors of the states, actions, and rewards, and <code>undiscounted_reward(h)</code> and <code>discounted_reward(h)</code> will return the total rewards collected over the trajectory. <code>n_steps(h)</code> returns the number of steps in the history. <code>exception(h)</code> and <code>backtrace(h)</code> can be used to hold an exception if the simulation failed to finish.</p><p><code>view(h, range)</code> (e.g. <code>view(h, 1:n_steps(h)-4)</code>) can be used to create a view of the history object <code>h</code> that only contains a certain range of steps. The object returned by <code>view</code> is an <code>AbstractSimHistory</code> that can be iterated through and manipulated just like a complete <code>SimHistory</code>.</p><h2 id="Parallel"><a class="docs-heading-anchor" href="#Parallel">Parallel</a><a id="Parallel-1"></a><a class="docs-heading-anchor-permalink" href="#Parallel" title="Permalink"></a></h2><p>POMDPTools contains a utility for running many Monte Carlo simulations in parallel to evaluate performance. 
The basic workflow involves the following steps:</p><ol><li>Create a vector of <a href="#POMDPTools.Simulators.Sim"><code>Sim</code></a> objects, each specifying how a single simulation should be run.</li><li>Use the <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a> or <a href="#Base.run"><code>run</code></a> function to run the simulations.</li><li>Analyze the results of the simulations contained in the <a href="https://github.com/JuliaData/DataFrames.jl"><code>DataFrame</code></a> returned by <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a>.</li></ol><h3 id="Example"><a class="docs-heading-anchor" href="#Example">Example</a><a id="Example-1"></a><a class="docs-heading-anchor-permalink" href="#Example" title="Permalink"></a></h3><p>An example can be found in the <a href="../../example_simulations/#Parallel-Simulations">Parallel Simulations</a> section.</p><h3 id="Sim-objects"><a class="docs-heading-anchor" href="#Sim-objects">Sim objects</a><a id="Sim-objects-1"></a><a class="docs-heading-anchor-permalink" href="#Sim-objects" title="Permalink"></a></h3><p>Each simulation should be specified by a <a href="#POMDPTools.Simulators.Sim"><code>Sim</code></a> object which contains all the information needed to run a simulation, including the <code>Simulator</code>, <code>POMDP</code> or <code>MDP</code>, <code>Policy</code>, <code>Updater</code>, and any other ingredients.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Simulators.Sim" href="#POMDPTools.Simulators.Sim"><code>POMDPTools.Simulators.Sim</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">Sim(m::MDP, p::Policy[, initialstate]; kwargs...)
-Sim(m::POMDP, p::Policy[, updater[, initial_belief[, initialstate]]]; kwargs...)</code></pre><p>Create a Sim object that contains everything needed to run and record a single simulation, including model, initial conditions, and metadata.</p><p>A vector of <code>Sim</code> objects can be executed with <a href="#Base.run"><code>run</code></a> or <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a>.</p><p><strong>Keyword Arguments</strong></p><ul><li><code>rng::AbstractRNG=Random.default_rng()</code></li><li><code>max_steps::Int=typemax(Int)</code></li><li><code>simulator::Simulator=HistoryRecorder(rng=rng, max_steps=max_steps)</code></li><li><code>metadata::NamedTuple a named tuple (or dictionary) of metadata for the sim that will be recorded, e.g.</code>(solver_iterations=500,)`.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Simulators/parallel.jl#L1-L14">source</a></section></article><h3 id="Running-simulations"><a class="docs-heading-anchor" href="#Running-simulations">Running simulations</a><a id="Running-simulations-1"></a><a class="docs-heading-anchor-permalink" href="#Running-simulations" title="Permalink"></a></h3><p>The simulations are actually carried out by the <code>run</code> and <code>run_parallel</code> functions.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Simulators.run_parallel" href="#POMDPTools.Simulators.run_parallel"><code>POMDPTools.Simulators.run_parallel</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">run_parallel(queue::Vector{Sim})
+end</code></pre><p>The possible valid elements in the iteration specification are</p><ul><li>Any node in the (PO)MDP Dynamic Decision network (by default <code>:s</code>, <code>:a</code>, <code>:sp</code>, <code>:o</code>, <code>:r</code>)</li><li><code>b</code> - the initial belief in the step (for POMDPs only)</li><li><code>bp</code> - the belief after being updated based on <code>o</code> (for POMDPs only)</li><li><code>action_info</code> - info from the policy decision (from <code>action_info</code>)</li><li><code>update_info</code> - info from the belief update (from <code>update_info</code>)</li><li><code>t</code> - the timestep index</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Simulators/history.jl#L96-L125">source</a></section></article><h4 id="Examples:"><a class="docs-heading-anchor" href="#Examples:">Examples:</a><a id="Examples:-1"></a><a class="docs-heading-anchor-permalink" href="#Examples:" title="Permalink"></a></h4><pre><code class="language-julia hljs">collect(eachstep(h, &quot;a,o&quot;))</code></pre><p>will produce a vector of action-observation named tuples.</p><pre><code class="language-julia hljs">collect(norm(sp-s) for (s,sp) in eachstep(h, &quot;s,sp&quot;))</code></pre><p>will produce a vector of the distances traveled on each step (assuming the state is a Euclidean vector).</p><h4 id="Notes"><a class="docs-heading-anchor" href="#Notes">Notes</a><a id="Notes-1"></a><a class="docs-heading-anchor-permalink" href="#Notes" title="Permalink"></a></h4><ul><li>The iteration specification can be specified as a tuple of symbols (e.g. 
<code>(:s, :a)</code>) instead of a string.</li><li>For type stability in performance-critical code, one should construct an iterator directly using <code>HistoryIterator{typeof(h), (:a,:r)}(h)</code> rather than <code>eachstep(h, &quot;ar&quot;)</code>.</li></ul><h3 id="Other-Functions"><a class="docs-heading-anchor" href="#Other-Functions">Other Functions</a><a id="Other-Functions-1"></a><a class="docs-heading-anchor-permalink" href="#Other-Functions" title="Permalink"></a></h3><p><code>state_hist(h)</code>, <code>action_hist(h)</code>, <code>observation_hist(h)</code>, <code>belief_hist(h)</code>, and <code>reward_hist(h)</code> will return vectors of the states, actions, observations, beliefs, and rewards, and <code>undiscounted_reward(h)</code> and <code>discounted_reward(h)</code> will return the total rewards collected over the trajectory. <code>n_steps(h)</code> returns the number of steps in the history. <code>exception(h)</code> and <code>backtrace(h)</code> can be used to access the exception and its backtrace if the simulation failed to finish.</p><p><code>view(h, range)</code> (e.g. <code>view(h, 1:n_steps(h)-4)</code>) can be used to create a view of the history object <code>h</code> that only contains a certain range of steps. The object returned by <code>view</code> is an <code>AbstractSimHistory</code> that can be iterated through and manipulated just like a complete <code>SimHistory</code>.</p><h2 id="Parallel"><a class="docs-heading-anchor" href="#Parallel">Parallel</a><a id="Parallel-1"></a><a class="docs-heading-anchor-permalink" href="#Parallel" title="Permalink"></a></h2><p>POMDPTools contains a utility for running many Monte Carlo simulations in parallel to evaluate performance. 
The basic workflow involves the following steps:</p><ol><li>Create a vector of <a href="#POMDPTools.Simulators.Sim"><code>Sim</code></a> objects, each specifying how a single simulation should be run.</li><li>Use the <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a> or <a href="#Base.run"><code>run</code></a> function to run the simulations.</li><li>Analyze the results of the simulations contained in the <a href="https://github.com/JuliaData/DataFrames.jl"><code>DataFrame</code></a> returned by <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a>.</li></ol><h3 id="Example"><a class="docs-heading-anchor" href="#Example">Example</a><a id="Example-1"></a><a class="docs-heading-anchor-permalink" href="#Example" title="Permalink"></a></h3><p>An example can be found in the <a href="../../example_simulations/#Parallel-Simulations">Parallel Simulations</a> section.</p><h3 id="Sim-objects"><a class="docs-heading-anchor" href="#Sim-objects">Sim objects</a><a id="Sim-objects-1"></a><a class="docs-heading-anchor-permalink" href="#Sim-objects" title="Permalink"></a></h3><p>Each simulation should be specified by a <a href="#POMDPTools.Simulators.Sim"><code>Sim</code></a> object which contains all the information needed to run a simulation, including the <code>Simulator</code>, <code>POMDP</code> or <code>MDP</code>, <code>Policy</code>, <code>Updater</code>, and any other ingredients.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Simulators.Sim" href="#POMDPTools.Simulators.Sim"><code>POMDPTools.Simulators.Sim</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">Sim(m::MDP, p::Policy[, initialstate]; kwargs...)
+Sim(m::POMDP, p::Policy[, updater[, initial_belief[, initialstate]]]; kwargs...)</code></pre><p>Create a Sim object that contains everything needed to run and record a single simulation, including model, initial conditions, and metadata.</p><p>A vector of <code>Sim</code> objects can be executed with <a href="#Base.run"><code>run</code></a> or <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a>.</p><p><strong>Keyword Arguments</strong></p><ul><li><code>rng::AbstractRNG=Random.default_rng()</code></li><li><code>max_steps::Int=typemax(Int)</code></li><li><code>simulator::Simulator=HistoryRecorder(rng=rng, max_steps=max_steps)</code></li><li><code>metadata::NamedTuple</code>: a named tuple (or dictionary) of metadata for the sim that will be recorded, e.g. <code>(solver_iterations=500,)</code>.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Simulators/parallel.jl#L1-L14">source</a></section></article><h3 id="Running-simulations"><a class="docs-heading-anchor" href="#Running-simulations">Running simulations</a><a id="Running-simulations-1"></a><a class="docs-heading-anchor-permalink" href="#Running-simulations" title="Permalink"></a></h3><p>The simulations are actually carried out by the <code>run</code> and <code>run_parallel</code> functions.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Simulators.run_parallel" href="#POMDPTools.Simulators.run_parallel"><code>POMDPTools.Simulators.run_parallel</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">run_parallel(queue::Vector{Sim})
 run_parallel(f::Function, queue::Vector{Sim})</code></pre><p>Run <code>Sim</code> objects in <code>queue</code> in parallel and return results as a <code>DataFrame</code>.</p><p>By default, the <code>DataFrame</code> will contain the reward for each simulation and the metadata provided to the sim.</p><p><strong>Arguments</strong></p><ul><li><code>queue</code>: List of <code>Sim</code> objects to be executed</li><li><code>f</code>: Function to process the results of each simulation</li></ul><p>This function should take two arguments, (1) the <code>Sim</code> that was executed and (2) the result of the simulation, by default a <code>SimHistory</code>. It should return a named tuple that will appear in the dataframe. See Examples below.</p><p><strong>Keyword Arguments</strong></p><ul><li><code>show_progress::Bool</code>: whether or not to show a progress meter</li><li><code>progress::ProgressMeter.Progress</code>: determines how the progress meter is displayed</li></ul><p><strong>Examples</strong></p><pre><code class="language-julia hljs">run_parallel(queue) do sim, hist
     return (n_steps=n_steps(hist), reward=discounted_reward(hist))
-end</code></pre><p>will return a dataframe with with the number of steps and the reward in it.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Simulators/parallel.jl#L95-L120">source</a></section></article><p>The <code>run</code> function is also provided to run simulations in serial (this is often useful for debugging). Note that the documentation below also contains a section for the builtin julia <code>run</code> function, even though it is not relevant here.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.run" href="#Base.run"><code>Base.run</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">run(queue::Vector{Sim})
-run(f::Function, queue::Vector{Sim})</code></pre><p>Run the <code>Sim</code> objects in <code>queue</code> on a single process and return the results as a dataframe.</p><p>See <code>run_parallel</code> for more information.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Simulators/parallel.jl#L155-L162">source</a></section></article><h3 id="Specifying-information-to-be-recorded"><a class="docs-heading-anchor" href="#Specifying-information-to-be-recorded">Specifying information to be recorded</a><a id="Specifying-information-to-be-recorded-1"></a><a class="docs-heading-anchor-permalink" href="#Specifying-information-to-be-recorded" title="Permalink"></a></h3><p>By default, only the discounted rewards from each simulation are recorded, but arbitrary information can be recorded.</p><p>The <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a> and <a href="#Base.run"><code>run</code></a> functions accept a function (normally specified via the <a href="https://docs.julialang.org/en/v1/manual/functions/#Do-Block-Syntax-for-Function-Arguments-1"><code>do</code> syntax</a>) that takes the <a href="#POMDPTools.Simulators.Sim"><code>Sim</code></a> object and <a href="#Histories">history</a> of the simulation and extracts relevant statistics as a named tuple. For example, if the desired characteristics are the number of steps in the simulation and the reward, <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a> would be invoked as follows:</p><pre><code class="language-julia hljs">df = run_parallel(queue) do sim::Sim, hist::SimHistory
+end</code></pre><p>will return a dataframe with the number of steps and the reward in it.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Simulators/parallel.jl#L95-L120">source</a></section></article><p>The <code>run</code> function is also provided to run simulations in serial (this is often useful for debugging). Note that the documentation below also contains a section for the builtin julia <code>run</code> function, even though it is not relevant here.</p><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.run" href="#Base.run"><code>Base.run</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">run(queue::Vector{Sim})
+run(f::Function, queue::Vector{Sim})</code></pre><p>Run the <code>Sim</code> objects in <code>queue</code> on a single process and return the results as a dataframe.</p><p>See <code>run_parallel</code> for more information.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Simulators/parallel.jl#L155-L162">source</a></section></article><h3 id="Specifying-information-to-be-recorded"><a class="docs-heading-anchor" href="#Specifying-information-to-be-recorded">Specifying information to be recorded</a><a id="Specifying-information-to-be-recorded-1"></a><a class="docs-heading-anchor-permalink" href="#Specifying-information-to-be-recorded" title="Permalink"></a></h3><p>By default, only the discounted rewards from each simulation are recorded, but arbitrary information can be recorded.</p><p>The <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a> and <a href="#Base.run"><code>run</code></a> functions accept a function (normally specified via the <a href="https://docs.julialang.org/en/v1/manual/functions/#Do-Block-Syntax-for-Function-Arguments-1"><code>do</code> syntax</a>) that takes the <a href="#POMDPTools.Simulators.Sim"><code>Sim</code></a> object and <a href="#Histories">history</a> of the simulation and extracts relevant statistics as a named tuple. For example, if the desired characteristics are the number of steps in the simulation and the reward, <a href="#POMDPTools.Simulators.run_parallel"><code>run_parallel</code></a> would be invoked as follows:</p><pre><code class="language-julia hljs">df = run_parallel(queue) do sim::Sim, hist::SimHistory
     return (n_steps=n_steps(hist), reward=discounted_reward(hist))
 end</code></pre><p>These statistics are combined into a <a href="https://github.com/JuliaData/DataFrames.jl"><code>DataFrame</code></a>, with each line representing a single simulation, allowing for statistical analysis. For example,</p><pre><code class="language-julia hljs">mean(df[:reward]./df[:n_steps])</code></pre><p>would compute the average reward per step with each simulation weighted equally regardless of length.</p><h2 id="Display"><a class="docs-heading-anchor" href="#Display">Display</a><a id="Display-1"></a><a class="docs-heading-anchor-permalink" href="#Display" title="Permalink"></a></h2><h3 id="DisplaySimulator"><a class="docs-heading-anchor" href="#DisplaySimulator"><code>DisplaySimulator</code></a><a id="DisplaySimulator-1"></a><a class="docs-heading-anchor-permalink" href="#DisplaySimulator" title="Permalink"></a></h3><p>The <code>DisplaySimulator</code> displays each step of a simulation in real time through a multimedia display such as a Jupyter notebook or <a href="https://github.com/queryverse/ElectronDisplay.jl">ElectronDisplay</a>. Specifically it uses <a href="../visualization/#POMDPTools.ModelTools.render"><code>POMDPTools.render</code></a> and the built-in Julia <a href="https://docs.julialang.org/en/v1/base/io-network/#Base.Multimedia.display"><code>display</code> function</a> to visualize each step.</p><p>Example:</p><pre><code class="language-julia hljs">using POMDPs
 using POMDPModels
@@ -77,4 +77,4 @@
 m = SimpleGridWorld()
 simulate(ds, m, RandomPolicy(m))</code></pre><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Simulators.DisplaySimulator" href="#POMDPTools.Simulators.DisplaySimulator"><code>POMDPTools.Simulators.DisplaySimulator</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">DisplaySimulator(;kwargs...)</code></pre><p>Create a simulator that displays each step of a simulation.</p><p>Given a POMDP or MDP model <code>m</code>, this simulator roughly works like</p><pre><code class="nohighlight hljs">for step in stepthrough(m, ...)
     display(render(m, step))
-end</code></pre><p><strong>Keyword Arguments</strong></p><ul><li><code>display::AbstractDisplay</code>: the display to use for the first argument to the <code>display</code> function. If this is <code>nothing</code>, <code>display(...)</code> will be called without an <code>AbstractDisplay</code> argument.</li><li><code>render_kwargs::NamedTuple</code>: keyword arguments for <code>POMDPTools.render(...)</code></li><li><code>max_fps::Number=10</code>: maximum number of frames to be displayed per second - <code>sleep</code> will be used to skip extra time, so this is not designed for high precision</li><li><code>predisplay::Function</code>: function to call before every call to <code>display(...)</code>. The only argument to this function will be the display (if it is specified) or <code>nothing</code></li><li><code>extra_initial::Bool=false</code>: if <code>true</code>, display an extra step at the beginning with only elements <code>t</code>, <code>sp</code>, and <code>bp</code> for POMDPs (this can be useful to see the initial state if <code>render</code> displays only <code>sp</code> and not <code>s</code>).</li><li><code>extra_final</code>::Bool=true<code>: if</code>true<code>, display an extra step at the end with only elements</code>t<code>,</code>done<code>,</code>s<code>, and</code>b<code>for POMDPs (this can be useful to see the final state if</code>render<code>displays only</code>s<code>and not</code>sp`).</li><li><code>max_steps::Integer</code>: maximum number of steps to run for</li><li><code>spec::NTuple{Symbol}</code>: specification of what step elements to display (see <code>eachstep</code>)</li><li><code>rng::AbstractRNG</code>: random number generator</li></ul><p>See the POMDPSimulators documentation for more tips about using specific displays.</p></div><a class="docs-sourcelink" target="_blank" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Simulators/display.jl#L11-L34">source</a></section></article><h3 id="Display-specific-tips"><a class="docs-heading-anchor" href="#Display-specific-tips">Display-specific tips</a><a id="Display-specific-tips-1"></a><a class="docs-heading-anchor-permalink" href="#Display-specific-tips" title="Permalink"></a></h3><p>The following tips may be helpful when using particular displays.</p><h4 id="Jupyter-notebooks"><a class="docs-heading-anchor" href="#Jupyter-notebooks">Jupyter notebooks</a><a id="Jupyter-notebooks-1"></a><a class="docs-heading-anchor-permalink" href="#Jupyter-notebooks" title="Permalink"></a></h4><p>By default, in a Jupyter notebook, the visualizations of all steps are displayed in the output box one after another. To make the output animated instead, where the image is overwritten at each step, one may use</p><pre><code class="language-julia hljs">DisplaySimulator(predisplay=(d)-&gt;IJulia.clear_output(true))</code></pre><h4 id="ElectronDisplay"><a class="docs-heading-anchor" href="#ElectronDisplay">ElectronDisplay</a><a id="ElectronDisplay-1"></a><a class="docs-heading-anchor-permalink" href="#ElectronDisplay" title="Permalink"></a></h4><p>By default, ElectronDisplay will open a new window for each new step. 
To prevent this, use</p><pre><code class="language-julia hljs">ElectronDisplay.CONFIG.single_window = true</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../policies/">« Implemented Policies</a><a class="docs-footer-nextpage" href="../common_rl/">CommonRLInterface Integration »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+end</code></pre><p><strong>Keyword Arguments</strong></p><ul><li><code>display::AbstractDisplay</code>: the display to use for the first argument to the <code>display</code> function. If this is <code>nothing</code>, <code>display(...)</code> will be called without an <code>AbstractDisplay</code> argument.</li><li><code>render_kwargs::NamedTuple</code>: keyword arguments for <code>POMDPTools.render(...)</code></li><li><code>max_fps::Number=10</code>: maximum number of frames to be displayed per second - <code>sleep</code> will be used to skip extra time, so this is not designed for high precision</li><li><code>predisplay::Function</code>: function to call before every call to <code>display(...)</code>. The only argument to this function will be the display (if it is specified) or <code>nothing</code></li><li><code>extra_initial::Bool=false</code>: if <code>true</code>, display an extra step at the beginning with only elements <code>t</code>, <code>sp</code>, and <code>bp</code> for POMDPs (this can be useful to see the initial state if <code>render</code> displays only <code>sp</code> and not <code>s</code>).</li><li><code>extra_final::Bool=true</code>: if <code>true</code>, display an extra step at the end with only elements <code>t</code>, <code>done</code>, <code>s</code>, and <code>b</code> for POMDPs (this can be useful to see the final state if <code>render</code> displays only <code>s</code> and not <code>sp</code>).</li><li><code>max_steps::Integer</code>: maximum number of steps to run for</li><li><code>spec::NTuple{Symbol}</code>: specification of what step elements to display (see <code>eachstep</code>)</li><li><code>rng::AbstractRNG</code>: random number generator</li></ul><p>See the POMDPSimulators documentation for more tips about using specific displays.</p></div><a class="docs-sourcelink" target="_blank" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Simulators/display.jl#L11-L34">source</a></section></article><h3 id="Display-specific-tips"><a class="docs-heading-anchor" href="#Display-specific-tips">Display-specific tips</a><a id="Display-specific-tips-1"></a><a class="docs-heading-anchor-permalink" href="#Display-specific-tips" title="Permalink"></a></h3><p>The following tips may be helpful when using particular displays.</p><h4 id="Jupyter-notebooks"><a class="docs-heading-anchor" href="#Jupyter-notebooks">Jupyter notebooks</a><a id="Jupyter-notebooks-1"></a><a class="docs-heading-anchor-permalink" href="#Jupyter-notebooks" title="Permalink"></a></h4><p>By default, in a Jupyter notebook, the visualizations of all steps are displayed in the output box one after another. To make the output animated instead, where the image is overwritten at each step, one may use</p><pre><code class="language-julia hljs">DisplaySimulator(predisplay=(d)-&gt;IJulia.clear_output(true))</code></pre><h4 id="ElectronDisplay"><a class="docs-heading-anchor" href="#ElectronDisplay">ElectronDisplay</a><a id="ElectronDisplay-1"></a><a class="docs-heading-anchor-permalink" href="#ElectronDisplay" title="Permalink"></a></h4><p>By default, ElectronDisplay will open a new window for each new step. 
To prevent this, use</p><pre><code class="language-julia hljs">ElectronDisplay.CONFIG.single_window = true</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../policies/">« Implemented Policies</a><a class="docs-footer-nextpage" href="../common_rl/">CommonRLInterface Integration »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/POMDPTools/testing/index.html b/dev/POMDPTools/testing/index.html
index fd25d638..581fc45b 100644
--- a/dev/POMDPTools/testing/index.html
+++ b/dev/POMDPTools/testing/index.html
@@ -1,8 +1,8 @@
 <!DOCTYPE html>
 <html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Testing · POMDPs.jl</title><meta name="title" content="Testing · POMDPs.jl"/><meta property="og:title" content="Testing · POMDPs.jl"/><meta property="twitter:title" content="Testing · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" 
type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../../">POMDPs.jl</a></li><li><a class="tocitem" href="../../install/">Installation</a></li><li><a class="tocitem" href="../../get_started/">Getting Started</a></li><li><a class="tocitem" href="../../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../../def_solver/">Solvers</a></li><li><a class="tocitem" href="../../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief 
Updaters</span><ul><li><a class="tocitem" href="../../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../../examples/">Examples</a></li><li><a class="tocitem" href="../../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../model/">Model Tools</a></li><li><a class="tocitem" href="../visualization/">Visualization</a></li><li><a class="tocitem" href="../beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../policies/">Implemented Policies</a></li><li><a class="tocitem" href="../simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../common_rl/">CommonRLInterface Integration</a></li><li class="is-active"><a class="tocitem" href>Testing</a><ul class="internal"><li><a class="tocitem" href="#Testing-(PO)MDP-Models"><span>Testing (PO)MDP Models</span></a></li><li><a class="tocitem" href="#Testing-Solvers"><span>Testing Solvers</span></a></li></ul></li></ul></li><li><a class="tocitem" href="../../faq/">Frequently Asked Questions 
(FAQ)</a></li><li><a class="tocitem" href="../../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">POMDPTools</a></li><li class="is-active"><a href>Testing</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Testing</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/POMDPTools/testing.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Testing"><a class="docs-heading-anchor" href="#Testing">Testing</a><a id="Testing-1"></a><a class="docs-heading-anchor-permalink" href="#Testing" title="Permalink"></a></h1><p>POMDPTools contains basic utilities for testing models and solvers.</p><h2 id="Testing-(PO)MDP-Models"><a class="docs-heading-anchor" href="#Testing-(PO)MDP-Models">Testing (PO)MDP Models</a><a id="Testing-(PO)MDP-Models-1"></a><a 
class="docs-heading-anchor-permalink" href="#Testing-(PO)MDP-Models" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Testing.has_consistent_distributions" href="#POMDPTools.Testing.has_consistent_distributions"><code>POMDPTools.Testing.has_consistent_distributions</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">has_consistent_distributions(m::MDP; atol=0)
-has_consistent_distributions(m::POMDP; atol=0)</code></pre><p>Return true if no problems are found in the distributions for a discrete problem. Print information and return false if problems are found.</p><p>Tests whether</p><ul><li>All probabilities are positive</li><li>Probabilities for all distributions sum to 1</li><li>All items with positive probability are in the support</li></ul><p><strong>Keyword Arguments</strong></p><ul><li><code>atol</code>: absolute tolerance passed to <code>approx</code> for all probability checks</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Testing/model.jl#L1-L14">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Testing.has_consistent_initial_distribution" href="#POMDPTools.Testing.has_consistent_initial_distribution"><code>POMDPTools.Testing.has_consistent_initial_distribution</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">has_consistent_initial_distribution(m; atol=0)</code></pre><p>Return true if no problems are found with the initial state distribution for a discrete problem. 
Print information and return false if problems are found.</p><p>See <code>has_consistent_distributions</code> for information on what checks are performed.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Testing/model.jl#L114-L120">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Testing.has_consistent_transition_distributions" href="#POMDPTools.Testing.has_consistent_transition_distributions"><code>POMDPTools.Testing.has_consistent_transition_distributions</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">has_consistent_transition_distributions(m; atol=0)</code></pre><p>Return true if no problems are found in the transition distributions for a discrete problem. 
Print information and return false if problems are found.</p><p>See <code>has_consistent_distributions</code> for information on what checks are performed.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Testing/model.jl#L28-L34">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Testing.has_consistent_observation_distributions" href="#POMDPTools.Testing.has_consistent_observation_distributions"><code>POMDPTools.Testing.has_consistent_observation_distributions</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">has_consistent_observation_distributions(m; atol=0)</code></pre><p>Return true if no problems are found in the observation distributions for a discrete POMDP. 
Print information and return false if problems are found.</p><p>See <code>has_consistent_distributions</code> for information on what checks are performed.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Testing/model.jl#L70-L76">source</a></section></article><h2 id="Testing-Solvers"><a class="docs-heading-anchor" href="#Testing-Solvers">Testing Solvers</a><a id="Testing-Solvers-1"></a><a class="docs-heading-anchor-permalink" href="#Testing-Solvers" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Testing.test_solver" href="#POMDPTools.Testing.test_solver"><code>POMDPTools.Testing.test_solver</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">test_solver(solver::Solver, problem::POMDP)
+has_consistent_distributions(m::POMDP; atol=0)</code></pre><p>Return true if no problems are found in the distributions for a discrete problem. Print information and return false if problems are found.</p><p>Tests whether</p><ul><li>All probabilities are positive</li><li>Probabilities for all distributions sum to 1</li><li>All items with positive probability are in the support</li></ul><p><strong>Keyword Arguments</strong></p><ul><li><code>atol</code>: absolute tolerance passed to <code>approx</code> for all probability checks</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Testing/model.jl#L1-L14">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Testing.has_consistent_initial_distribution" href="#POMDPTools.Testing.has_consistent_initial_distribution"><code>POMDPTools.Testing.has_consistent_initial_distribution</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">has_consistent_initial_distribution(m; atol=0)</code></pre><p>Return true if no problems are found with the initial state distribution for a discrete problem. 
Print information and return false if problems are found.</p><p>See <code>has_consistent_distributions</code> for information on what checks are performed.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Testing/model.jl#L114-L120">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Testing.has_consistent_transition_distributions" href="#POMDPTools.Testing.has_consistent_transition_distributions"><code>POMDPTools.Testing.has_consistent_transition_distributions</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">has_consistent_transition_distributions(m; atol=0)</code></pre><p>Return true if no problems are found in the transition distributions for a discrete problem. 
Print information and return false if problems are found.</p><p>See <code>has_consistent_distributions</code> for information on what checks are performed.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Testing/model.jl#L28-L34">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Testing.has_consistent_observation_distributions" href="#POMDPTools.Testing.has_consistent_observation_distributions"><code>POMDPTools.Testing.has_consistent_observation_distributions</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">has_consistent_observation_distributions(m; atol=0)</code></pre><p>Return true if no problems are found in the observation distributions for a discrete POMDP. 
Print information and return false if problems are found.</p><p>See <code>has_consistent_distributions</code> for information on what checks are performed.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Testing/model.jl#L70-L76">source</a></section></article><h2 id="Testing-Solvers"><a class="docs-heading-anchor" href="#Testing-Solvers">Testing Solvers</a><a id="Testing-Solvers-1"></a><a class="docs-heading-anchor-permalink" href="#Testing-Solvers" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.Testing.test_solver" href="#POMDPTools.Testing.test_solver"><code>POMDPTools.Testing.test_solver</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">test_solver(solver::Solver, problem::POMDP)
 test_solver(solver::Solver, problem::MDP)</code></pre><p>Use the solver to solve the specified problem, then run a simulation.</p><p>This is designed to illustrate how solvers are expected to function. All solvers should be able to complete this standard test with the simple models in the POMDPModels package.</p><p>Note that this does NOT test the optimality of the solution, but is only a smoke test to see if the solver interacts with POMDP models as expected.</p><p>To run this with a solver called YourSolver, run</p><pre><code class="nohighlight hljs">using POMDPToolbox
 using POMDPModels
 
 solver = YourSolver(# initialize with parameters #)
-test_solver(solver, BabyPOMDP())</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/Testing/solver.jl#L59-L77">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../common_rl/">« CommonRLInterface Integration</a><a class="docs-footer-nextpage" href="../../faq/">Frequently Asked Questions (FAQ) »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+test_solver(solver, BabyPOMDP())</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/Testing/solver.jl#L59-L77">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../common_rl/">« CommonRLInterface Integration</a><a class="docs-footer-nextpage" href="../../faq/">Frequently Asked Questions (FAQ) »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/POMDPTools/visualization/index.html b/dev/POMDPTools/visualization/index.html
index 2f63d407..e483af07 100644
--- a/dev/POMDPTools/visualization/index.html
+++ b/dev/POMDPTools/visualization/index.html
@@ -1,7 +1,7 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Visualization · POMDPs.jl</title><meta name="title" content="Visualization · POMDPs.jl"/><meta property="og:title" content="Visualization · POMDPs.jl"/><meta property="twitter:title" content="Visualization · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" 
rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../../">POMDPs.jl</a></li><li><a class="tocitem" href="../../install/">Installation</a></li><li><a class="tocitem" href="../../get_started/">Getting Started</a></li><li><a class="tocitem" href="../../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../../def_solver/">Solvers</a></li><li><a class="tocitem" href="../../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief 
Updaters</span><ul><li><a class="tocitem" href="../../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../../examples/">Examples</a></li><li><a class="tocitem" href="../../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../model/">Model Tools</a></li><li class="is-active"><a class="tocitem" href>Visualization</a></li><li><a class="tocitem" href="../beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../policies/">Implemented Policies</a></li><li><a class="tocitem" href="../simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static 
is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">POMDPTools</a></li><li class="is-active"><a href>Visualization</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Visualization</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/POMDPTools/visualization.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Visualization"><a class="docs-heading-anchor" href="#Visualization">Visualization</a><a id="Visualization-1"></a><a class="docs-heading-anchor-permalink" href="#Visualization" title="Permalink"></a></h1><p>POMDPTools contains a basic visualization interface consisting of the <code>render</code> function.</p><p>Problem writers should implement a method of this function so that their problem can be visualized in a variety of contexts including jupyter notebooks, web browsers, or saved as images or animations.</p><article class="docstring"><header><a 
class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.render" href="#POMDPTools.ModelTools.render"><code>POMDPTools.ModelTools.render</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">render(m::Union{MDP,POMDP}, step::NamedTuple)</code></pre><p>Return a renderable representation of the step in problem <code>m</code>.</p><p>The renderable representation may be anything that has <code>show(io, mime, x)</code> methods. It could be a plot, svg, Compose.jl context, Cairo context, or image.</p><p><strong>Arguments</strong></p><p><code>step</code> is a <code>NamedTuple</code> that contains the states, action, etc. corresponding to one transition in a simulation. It may have the following fields:</p><ul><li><code>t</code>: the time step index</li><li><code>s</code>: the state at the beginning of the step</li><li><code>a</code>: the action</li><li><code>sp</code>: the state at the end of the step (s&#39;)</li><li><code>r</code>: the reward for the step</li><li><code>o</code>: the observation</li><li><code>b</code>: the belief at the </li><li><code>bp</code>: the belief at the end of the step</li><li><code>i</code>: info from the model when the state transition was calculated</li><li><code>ai</code>: info from the policy decision</li><li><code>ui</code>: info from the belief update</li></ul><p>Keyword arguments are reserved for the problem implementer and can be used to control appearance, etc.</p><p><strong>Important Notes</strong></p><ul><li><code>step</code> may not contain all of the elements listed above, so <code>render</code> should check for them and render only what is available</li><li><code>o</code> typically corresponds to <code>sp</code>, so it is often clearer for POMDPs to render <code>sp</code> rather than <code>s</code>.</li></ul></div><a class="docs-sourcelink" 
target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/lib/POMDPTools/src/ModelTools/visualization.jl#L1-L29">source</a></section></article><p>Sometimes it is important to have control over how the problem is rendered with different mimetypes. One way to handle this is to have render return a custom type, e.g.</p><pre><code class="language-julia hljs">struct MyProblemVisualization
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Visualization · POMDPs.jl</title><meta name="title" content="Visualization · POMDPs.jl"/><meta property="og:title" content="Visualization · POMDPs.jl"/><meta property="twitter:title" content="Visualization · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" 
rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../../">POMDPs.jl</a></li><li><a class="tocitem" href="../../install/">Installation</a></li><li><a class="tocitem" href="../../get_started/">Getting Started</a></li><li><a class="tocitem" href="../../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../../def_solver/">Solvers</a></li><li><a class="tocitem" href="../../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief 
Updaters</span><ul><li><a class="tocitem" href="../../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../../examples/">Examples</a></li><li><a class="tocitem" href="../../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../model/">Model Tools</a></li><li class="is-active"><a class="tocitem" href>Visualization</a></li><li><a class="tocitem" href="../beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../policies/">Implemented Policies</a></li><li><a class="tocitem" href="../simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static 
is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">POMDPTools</a></li><li class="is-active"><a href>Visualization</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Visualization</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/POMDPTools/visualization.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Visualization"><a class="docs-heading-anchor" href="#Visualization">Visualization</a><a id="Visualization-1"></a><a class="docs-heading-anchor-permalink" href="#Visualization" title="Permalink"></a></h1><p>POMDPTools contains a basic visualization interface consisting of the <code>render</code> function.</p><p>Problem writers should implement a method of this function so that their problem can be visualized in a variety of contexts including jupyter notebooks, web browsers, or saved as images or animations.</p><article class="docstring"><header><a 
class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPTools.ModelTools.render" href="#POMDPTools.ModelTools.render"><code>POMDPTools.ModelTools.render</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">render(m::Union{MDP,POMDP}, step::NamedTuple)</code></pre><p>Return a renderable representation of the step in problem <code>m</code>.</p><p>The renderable representation may be anything that has <code>show(io, mime, x)</code> methods. It could be a plot, svg, Compose.jl context, Cairo context, or image.</p><p><strong>Arguments</strong></p><p><code>step</code> is a <code>NamedTuple</code> that contains the states, action, etc. corresponding to one transition in a simulation. It may have the following fields:</p><ul><li><code>t</code>: the time step index</li><li><code>s</code>: the state at the beginning of the step</li><li><code>a</code>: the action</li><li><code>sp</code>: the state at the end of the step (s&#39;)</li><li><code>r</code>: the reward for the step</li><li><code>o</code>: the observation</li><li><code>b</code>: the belief at the beginning of the step</li><li><code>bp</code>: the belief at the end of the step</li><li><code>i</code>: info from the model when the state transition was calculated</li><li><code>ai</code>: info from the policy decision</li><li><code>ui</code>: info from the belief update</li></ul><p>Keyword arguments are reserved for the problem implementer and can be used to control appearance, etc.</p><p><strong>Important Notes</strong></p><ul><li><code>step</code> may not contain all of the elements listed above, so <code>render</code> should check for them and render only what is available</li><li><code>o</code> typically corresponds to <code>sp</code>, so it is often clearer for POMDPs to render <code>sp</code> rather than <code>s</code>.</li></ul></div><a class="docs-sourcelink" 
target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/lib/POMDPTools/src/ModelTools/visualization.jl#L1-L29">source</a></section></article><p>Sometimes it is important to have control over how the problem is rendered with different mimetypes. One way to handle this is to have render return a custom type, e.g.</p><pre><code class="language-julia hljs">struct MyProblemVisualization
     mdp::MyProblem
     step::NamedTuple
 end
 
-POMDPTools.render(mdp, step) = MyProblemVisualization(mdp, step)</code></pre><p>and then implement custom <code>show</code> methods, e.g.</p><pre><code class="language-julia hljs">show(io::IO, mime::MIME&quot;text/html&quot;, v::MyProblemVisualization)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../model/">« Model Tools</a><a class="docs-footer-nextpage" href="../beliefs/">Implemented Belief Updaters »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+POMDPTools.render(mdp, step) = MyProblemVisualization(mdp, step)</code></pre><p>and then implement custom <code>show</code> methods, e.g.</p><pre><code class="language-julia hljs">show(io::IO, mime::MIME&quot;text/html&quot;, v::MyProblemVisualization)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../model/">« Model Tools</a><a class="docs-footer-nextpage" href="../beliefs/">Implemented Belief Updaters »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/api/index.html b/dev/api/index.html
index 7f31c667..388f0410 100644
--- a/dev/api/index.html
+++ b/dev/api/index.html
@@ -1,36 +1,36 @@
 <!DOCTYPE html>
 <html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>API Documentation · POMDPs.jl</title><meta name="title" content="API Documentation · POMDPs.jl"/><meta property="og:title" content="API Documentation · POMDPs.jl"/><meta property="twitter:title" content="API Documentation · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" 
rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" 
href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li class="is-active"><a class="tocitem" href>API Documentation</a><ul class="internal"><li><a class="tocitem" href="#Contents"><span>Contents</span></a></li><li><a class="tocitem" 
href="#Index"><span>Index</span></a></li><li><a class="tocitem" href="#Types"><span>Types</span></a></li><li><a class="tocitem" href="#Model-Functions"><span>Model Functions</span></a></li><li><a class="tocitem" href="#Belief-Functions"><span>Belief Functions</span></a></li><li><a class="tocitem" href="#Policy-and-Solver-Functions"><span>Policy and Solver Functions</span></a></li><li><a class="tocitem" href="#Simulator"><span>Simulator</span></a></li></ul></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li class="is-active"><a href>API Documentation</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>API Documentation</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/api.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="API-Documentation"><a class="docs-heading-anchor" 
href="#API-Documentation">API Documentation</a><a id="API-Documentation-1"></a><a class="docs-heading-anchor-permalink" href="#API-Documentation" title="Permalink"></a></h1><p>Docstrings for POMDPs.jl interface members can be <a href="https://docs.julialang.org/en/v1/manual/documentation/index.html#Accessing-Documentation-1">accessed through Julia&#39;s built-in documentation system</a> or in the list below.</p><h2 id="Contents"><a class="docs-heading-anchor" href="#Contents">Contents</a><a id="Contents-1"></a><a class="docs-heading-anchor-permalink" href="#Contents" title="Permalink"></a></h2><ul><li><a href="#API-Documentation">API Documentation</a></li><li class="no-marker"><ul><li><a href="#Contents">Contents</a></li><li><a href="#Index">Index</a></li><li><a href="#Types">Types</a></li><li><a href="#Model-Functions">Model Functions</a></li><li><a href="#Belief-Functions">Belief Functions</a></li><li><a href="#Policy-and-Solver-Functions">Policy and Solver Functions</a></li><li><a href="#Simulator">Simulator</a></li></ul></li></ul><h2 id="Index"><a class="docs-heading-anchor" href="#Index">Index</a><a id="Index-1"></a><a class="docs-heading-anchor-permalink" href="#Index" title="Permalink"></a></h2><ul><li><a href="#POMDPs.MDP"><code>POMDPs.MDP</code></a></li><li><a href="#POMDPs.POMDP"><code>POMDPs.POMDP</code></a></li><li><a href="#POMDPs.Policy"><code>POMDPs.Policy</code></a></li><li><a href="#POMDPs.Simulator"><code>POMDPs.Simulator</code></a></li><li><a href="#POMDPs.Solver"><code>POMDPs.Solver</code></a></li><li><a href="#POMDPs.Updater"><code>POMDPs.Updater</code></a></li><li><a href="#Base.rand"><code>Base.rand</code></a></li><li><a href="#Distributions.pdf"><code>Distributions.pdf</code></a></li><li><a href="#Distributions.support"><code>Distributions.support</code></a></li><li><a href="#POMDPs.action"><code>POMDPs.action</code></a></li><li><a href="#POMDPs.actionindex"><code>POMDPs.actionindex</code></a></li><li><a 
href="#POMDPs.actions"><code>POMDPs.actions</code></a></li><li><a href="#POMDPs.actiontype"><code>POMDPs.actiontype</code></a></li><li><a href="#POMDPs.convert_a"><code>POMDPs.convert_a</code></a></li><li><a href="#POMDPs.convert_o"><code>POMDPs.convert_o</code></a></li><li><a href="#POMDPs.convert_s"><code>POMDPs.convert_s</code></a></li><li><a href="#POMDPs.currentobs"><code>POMDPs.currentobs</code></a></li><li><a href="#POMDPs.discount"><code>POMDPs.discount</code></a></li><li><a href="#POMDPs.gen"><code>POMDPs.gen</code></a></li><li><a href="#POMDPs.history"><code>POMDPs.history</code></a></li><li><a href="#POMDPs.initialize_belief"><code>POMDPs.initialize_belief</code></a></li><li><a href="#POMDPs.initialobs"><code>POMDPs.initialobs</code></a></li><li><a href="#POMDPs.initialstate"><code>POMDPs.initialstate</code></a></li><li><a href="#POMDPs.isterminal"><code>POMDPs.isterminal</code></a></li><li><a href="#POMDPs.observation"><code>POMDPs.observation</code></a></li><li><a href="#POMDPs.observations"><code>POMDPs.observations</code></a></li><li><a href="#POMDPs.obsindex"><code>POMDPs.obsindex</code></a></li><li><a href="#POMDPs.obstype"><code>POMDPs.obstype</code></a></li><li><a href="#POMDPs.reward"><code>POMDPs.reward</code></a></li><li><a href="#POMDPs.simulate"><code>POMDPs.simulate</code></a></li><li><a href="#POMDPs.solve"><code>POMDPs.solve</code></a></li><li><a href="#POMDPs.stateindex"><code>POMDPs.stateindex</code></a></li><li><a href="#POMDPs.states"><code>POMDPs.states</code></a></li><li><a href="#POMDPs.statetype"><code>POMDPs.statetype</code></a></li><li><a href="#POMDPs.transition"><code>POMDPs.transition</code></a></li><li><a href="#POMDPs.update"><code>POMDPs.update</code></a></li><li><a href="#POMDPs.updater"><code>POMDPs.updater</code></a></li><li><a href="#POMDPs.value"><code>POMDPs.value</code></a></li><li><a href="#Statistics.mean"><code>Statistics.mean</code></a></li><li><a href="#StatsBase.mode"><code>StatsBase.mode</code></a></li><li><a 
href="#POMDPs.@gen"><code>POMDPs.@gen</code></a></li></ul><h2 id="Types"><a class="docs-heading-anchor" href="#Types">Types</a><a id="Types-1"></a><a class="docs-heading-anchor-permalink" href="#Types" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.POMDP" href="#POMDPs.POMDP"><code>POMDPs.POMDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">POMDP{S,A,O}</code></pre><p>Abstract base type for a partially observable Markov decision process.</p><pre><code class="nohighlight hljs">S: state type
 A: action type
-O: observation type</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L2-L10">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.MDP" href="#POMDPs.MDP"><code>POMDPs.MDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">MDP{S,A}</code></pre><p>Abstract base type for a fully observable Markov decision process.</p><pre><code class="nohighlight hljs">S: state type
-A: action type</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L13-L20">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.Solver" href="#POMDPs.Solver"><code>POMDPs.Solver</code></a> — <span class="docstring-category">Type</span></header><section><div><p>Base type for an MDP/POMDP solver</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/solver.jl#L2-L4">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.Policy" href="#POMDPs.Policy"><code>POMDPs.Policy</code></a> — <span class="docstring-category">Type</span></header><section><div><p>Base type for a policy (a map from every possible belief, or more abstract policy state, to an optimal or suboptimal action)</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/policy.jl#L7-L9">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.Updater" href="#POMDPs.Updater"><code>POMDPs.Updater</code></a> — <span class="docstring-category">Type</span></header><section><div><p>Abstract type for an object that defines how the belief should be updated</p><p>A belief is a general construct that represents the knowledge an agent has about the state of the system. 
This can be a probability distribution, an action observation history or a more general representation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/belief.jl#L7-L13">source</a></section></article><h2 id="Model-Functions"><a class="docs-heading-anchor" href="#Model-Functions">Model Functions</a><a id="Model-Functions-1"></a><a class="docs-heading-anchor-permalink" href="#Model-Functions" title="Permalink"></a></h2><h3 id="Dynamics"><a class="docs-heading-anchor" href="#Dynamics">Dynamics</a><a id="Dynamics-1"></a><a class="docs-heading-anchor-permalink" href="#Dynamics" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.transition" href="#POMDPs.transition"><code>POMDPs.transition</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">transition(m::POMDP, state, action)
-transition(m::MDP, state, action)</code></pre><p>Return the transition distribution from the current state-action pair.</p><p>If it is difficult to define the probability density or mass function explicitly, consider using <code>POMDPModelTools.ImplicitDistribution</code> to define a generative model.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L31-L38">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.observation" href="#POMDPs.observation"><code>POMDPs.observation</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">observation(m::POMDP, statep)
+O: observation type</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L2-L10">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.MDP" href="#POMDPs.MDP"><code>POMDPs.MDP</code></a> — <span class="docstring-category">Type</span></header><section><div><pre><code class="language-julia hljs">MDP{S,A}</code></pre><p>Abstract base type for a fully observable Markov decision process.</p><pre><code class="nohighlight hljs">S: state type
+A: action type</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L13-L20">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.Solver" href="#POMDPs.Solver"><code>POMDPs.Solver</code></a> — <span class="docstring-category">Type</span></header><section><div><p>Base type for an MDP/POMDP solver</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/solver.jl#L2-L4">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.Policy" href="#POMDPs.Policy"><code>POMDPs.Policy</code></a> — <span class="docstring-category">Type</span></header><section><div><p>Base type for a policy (a map from every possible belief, or more abstract policy state, to an optimal or suboptimal action)</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/policy.jl#L7-L9">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.Updater" href="#POMDPs.Updater"><code>POMDPs.Updater</code></a> — <span class="docstring-category">Type</span></header><section><div><p>Abstract type for an object that defines how the belief should be updated</p><p>A belief is a general construct that represents the knowledge an agent has about the state of the system. 
This can be a probability distribution, an action observation history or a more general representation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/belief.jl#L7-L13">source</a></section></article><h2 id="Model-Functions"><a class="docs-heading-anchor" href="#Model-Functions">Model Functions</a><a id="Model-Functions-1"></a><a class="docs-heading-anchor-permalink" href="#Model-Functions" title="Permalink"></a></h2><h3 id="Dynamics"><a class="docs-heading-anchor" href="#Dynamics">Dynamics</a><a id="Dynamics-1"></a><a class="docs-heading-anchor-permalink" href="#Dynamics" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.transition" href="#POMDPs.transition"><code>POMDPs.transition</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">transition(m::POMDP, state, action)
+transition(m::MDP, state, action)</code></pre><p>Return the transition distribution from the current state-action pair.</p><p>If it is difficult to define the probability density or mass function explicitly, consider using <code>POMDPModelTools.ImplicitDistribution</code> to define a generative model.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L31-L38">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.observation" href="#POMDPs.observation"><code>POMDPs.observation</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">observation(m::POMDP, statep)
 observation(m::POMDP, action, statep)
 observation(m::POMDP, state, action, statep)</code></pre><p>Return the observation distribution. You need only define the method with the fewest arguments needed to determine the observation distribution.</p><p>If it is difficult to define the probability density or mass function explicitly, consider using <code>POMDPModelTools.ImplicitDistribution</code> to define a generative model.</p><p><strong>Example</strong></p><pre><code class="language-julia hljs">using POMDPModelTools # for SparseCat
 
 struct MyPOMDP &lt;: POMDP{Int, Int, Int} end
 
-observation(p::MyPOMDP, sp::Int) = SparseCat([sp-1, sp, sp+1], [0.1, 0.8, 0.1])</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L41-L58">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.reward" href="#POMDPs.reward"><code>POMDPs.reward</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">reward(m::POMDP, s, a)
+observation(p::MyPOMDP, sp::Int) = SparseCat([sp-1, sp, sp+1], [0.1, 0.8, 0.1])</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L41-L58">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.reward" href="#POMDPs.reward"><code>POMDPs.reward</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">reward(m::POMDP, s, a)
 reward(m::MDP, s, a)</code></pre><p>Return the immediate reward for the s-a pair.</p><pre><code class="nohighlight hljs">reward(m::POMDP, s, a, sp)
-reward(m::MDP, s, a, sp)</code></pre><p>Return the immediate reward for the s-a-s&#39; triple</p><pre><code class="nohighlight hljs">reward(m::POMDP, s, a, sp, o)</code></pre><p>Return the immediate reward for the s-a-s&#39;-o quad</p><p>For some problems, it is easier to express <code>reward(m, s, a, sp)</code> or <code>reward(m, s, a, sp, o)</code>, than <code>reward(m, s, a)</code>, but some solvers, e.g. SARSOP, can only use <code>reward(m, s, a)</code>. Both can be implemented for a problem, but when <code>reward(m, s, a)</code> is implemented, it should be consistent with <code>reward(m, s, a, sp[, o])</code>, that is, it should be the expected value over all destination states and observations.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L67-L83">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.gen" href="#POMDPs.gen"><code>POMDPs.gen</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">gen(m::Union{MDP,POMDP}, s, a, rng::AbstractRNG)</code></pre><p>Function for implementing the entire MDP/POMDP generative model by returning a <code>NamedTuple</code>.</p><p><code>gen</code> should <em>only</em> be implemented in the case where <em>two or more</em> of the next state, observation, and reward need to be generated at the same time. 
If the state transition model can be separated from the reward and observation models, you should implement <code>transition</code> with an <code>ImplicitDistribution</code> instead of <code>gen</code>.</p><p>Solver and simulator writers should use the <code>@gen</code> macro to call a generative model.</p><p><strong>Arguments</strong></p><ul><li><code>m</code>: an <code>MDP</code> or <code>POMDP</code> model</li><li><code>s</code>: the current state</li><li><code>a</code>: the action</li><li><code>rng</code>: a random number generator (Typically a <code>MersenneTwister</code>)</li></ul><p><strong>Return</strong></p><p>The function should return a <a href="https://docs.julialang.org/en/v1/base/base/#Core.NamedTuple"><code>NamedTuple</code></a>. With a subset of following entries:</p><p><strong>MDP</strong></p><ul><li><code>sp</code>: the next state</li><li><code>r</code>: the reward for the step</li><li><code>info</code>: extra debugging information, typically in an associative container like a NamedTuple</li></ul><p><strong>POMDP</strong></p><ul><li><code>sp</code>: the next state</li><li><code>o</code>: the observation</li><li><code>r</code>: the reward for the step</li><li><code>info</code>: extra debugging information, typically in an associative container like a NamedTuple</li></ul><p>Some elements can be left out. For instance if <code>o</code> is left out of the return, the problem-writer can also implement <code>observation</code> and POMDPs.jl will automatically use it when needed.</p><p><strong>Example</strong></p><pre><code class="language-julia hljs">struct LQRMDP &lt;: MDP{Float64, Float64} end
+reward(m::MDP, s, a, sp)</code></pre><p>Return the immediate reward for the s-a-s&#39; triple</p><pre><code class="nohighlight hljs">reward(m::POMDP, s, a, sp, o)</code></pre><p>Return the immediate reward for the s-a-s&#39;-o quad</p><p>For some problems, it is easier to express <code>reward(m, s, a, sp)</code> or <code>reward(m, s, a, sp, o)</code>, than <code>reward(m, s, a)</code>, but some solvers, e.g. SARSOP, can only use <code>reward(m, s, a)</code>. Both can be implemented for a problem, but when <code>reward(m, s, a)</code> is implemented, it should be consistent with <code>reward(m, s, a, sp[, o])</code>, that is, it should be the expected value over all destination states and observations.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L67-L83">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.gen" href="#POMDPs.gen"><code>POMDPs.gen</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">gen(m::Union{MDP,POMDP}, s, a, rng::AbstractRNG)</code></pre><p>Function for implementing the entire MDP/POMDP generative model by returning a <code>NamedTuple</code>.</p><p><code>gen</code> should <em>only</em> be implemented in the case where <em>two or more</em> of the next state, observation, and reward need to be generated at the same time. 
If the state transition model can be separated from the reward and observation models, you should implement <code>transition</code> with an <code>ImplicitDistribution</code> instead of <code>gen</code>.</p><p>Solver and simulator writers should use the <code>@gen</code> macro to call a generative model.</p><p><strong>Arguments</strong></p><ul><li><code>m</code>: an <code>MDP</code> or <code>POMDP</code> model</li><li><code>s</code>: the current state</li><li><code>a</code>: the action</li><li><code>rng</code>: a random number generator (Typically a <code>MersenneTwister</code>)</li></ul><p><strong>Return</strong></p><p>The function should return a <a href="https://docs.julialang.org/en/v1/base/base/#Core.NamedTuple"><code>NamedTuple</code></a>. With a subset of following entries:</p><p><strong>MDP</strong></p><ul><li><code>sp</code>: the next state</li><li><code>r</code>: the reward for the step</li><li><code>info</code>: extra debugging information, typically in an associative container like a NamedTuple</li></ul><p><strong>POMDP</strong></p><ul><li><code>sp</code>: the next state</li><li><code>o</code>: the observation</li><li><code>r</code>: the reward for the step</li><li><code>info</code>: extra debugging information, typically in an associative container like a NamedTuple</li></ul><p>Some elements can be left out. For instance if <code>o</code> is left out of the return, the problem-writer can also implement <code>observation</code> and POMDPs.jl will automatically use it when needed.</p><p><strong>Example</strong></p><pre><code class="language-julia hljs">struct LQRMDP &lt;: MDP{Float64, Float64} end
 
-POMDPs.gen(m::LQRMDP, s, a, rng) = (sp = s + a + randn(rng), r = -s^2 - a^2)</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/generative.jl#L1-L38">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.@gen" href="#POMDPs.@gen"><code>POMDPs.@gen</code></a> — <span class="docstring-category">Macro</span></header><section><div><pre><code class="language-julia hljs">@gen(X)(m, s, a)
-@gen(X)(m, s, a, rng::AbstractRNG)</code></pre><p>Call the generative model for a (PO)MDP <code>m</code>; Sample values from several nodes in the dynamic decision network. X is one or more symbols indicating which nodes to output.</p><p>Solvers and simulators should call this rather than the <code>gen</code> function. Problem writers should implement a method of the <code>transition</code> or <code>gen</code> function instead of altering <code>@gen</code>.</p><p><strong>Arguments</strong></p><ul><li><code>m</code>: an <code>MDP</code> or <code>POMDP</code> model</li><li><code>s</code>: the current state</li><li><code>a</code>: the action</li><li><code>rng</code> (optional): a random number generator (Typically a <code>MersenneTwister</code>)</li></ul><p><strong>Return</strong></p><p>If <code>X</code>, is a symbol, return a value sample from the corresponding node. If <code>X</code> is several symbols, return a <code>Tuple</code> of values sampled from the specified nodes.</p><p><strong>Examples</strong></p><p>Let <code>m</code> be an <code>MDP</code> or <code>POMDP</code>, <code>s</code> be a state of <code>m</code>, <code>a</code> be an action of <code>m</code>, and <code>rng</code> be an <code>AbstractRNG</code>.</p><ul><li><code>@gen(:sp, :r)(m, s, a)</code> returns a <code>Tuple</code> containing the next state and reward.</li><li><code>@gen(:sp, :o, :r)(m, s, a, rng)</code> returns a <code>Tuple</code> containing the next state, observation, and reward.</li><li><code>@gen(:sp)(m, s, a, rng)</code> returns the next state.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/generative.jl#L41-L63">source</a></section></article><h3 id="Static-Properties"><a class="docs-heading-anchor" href="#Static-Properties">Static Properties</a><a id="Static-Properties-1"></a><a class="docs-heading-anchor-permalink" href="#Static-Properties" title="Permalink"></a></h3><article 
class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.states" href="#POMDPs.states"><code>POMDPs.states</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">states(problem::POMDP)
-states(problem::MDP)</code></pre><p>Returns the complete state space of a POMDP. </p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/space.jl#L5-L10">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.actions" href="#POMDPs.actions"><code>POMDPs.actions</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">actions(m::Union{MDP,POMDP})</code></pre><p>Returns the entire action space of a (PO)MDP.</p><hr/><pre><code class="nohighlight hljs">actions(m::Union{MDP,POMDP}, s)</code></pre><p>Return the actions that can be taken from state <code>s</code>.</p><hr/><pre><code class="nohighlight hljs">actions(m::POMDP, b)</code></pre><p>Return the actions that can be taken from belief <code>b</code>.</p><p>To implement an observation-dependent action space, use <code>currentobs(b)</code> to get the observation associated with belief <code>b</code> within the implementation of <code>actions(m, b)</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/space.jl#L13-L29">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.observations" href="#POMDPs.observations"><code>POMDPs.observations</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">observations(problem::POMDP)</code></pre><p>Return the entire observation space.</p></div><a class="docs-sourcelink" target="_blank" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/space.jl#L35-L39">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.isterminal" href="#POMDPs.isterminal"><code>POMDPs.isterminal</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">isterminal(m::Union{MDP,POMDP}, s)</code></pre><p>Check if state <code>s</code> is terminal.</p><p>If a state is terminal, no actions will be taken in it and no additional rewards will be accumulated. Thus, the value function at such a state is, by definition, zero.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L92-L98">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.discount" href="#POMDPs.discount"><code>POMDPs.discount</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">discount(m::POMDP)
-discount(m::MDP)</code></pre><p>Return the discount factor for the problem.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L23-L28">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.initialstate" href="#POMDPs.initialstate"><code>POMDPs.initialstate</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">initialstate(m::Union{POMDP,MDP})</code></pre><p>Return a distribution of initial states for (PO)MDP <code>m</code>.</p><p>If it is difficult to define the probability density or mass function explicitly, consider using <code>POMDPModelTools.ImplicitDistribution</code> to define a model for sampling.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L101-L107">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.initialobs" href="#POMDPs.initialobs"><code>POMDPs.initialobs</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">initialobs(m::POMDP, s)</code></pre><p>Return a distribution of initial observations for POMDP <code>m</code> and state <code>s</code>.</p><p>If it is difficult to define the probability density or mass function explicitly, consider using <code>POMDPModelTools.ImplicitDistribution</code> to define a model for sampling.</p><p>This function is only used in cases where the policy expects an initial observation rather than an initial belief, e.g. 
in a reinforcement learning setting. It is not used in a standard POMDP simulation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L110-L118">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.stateindex" href="#POMDPs.stateindex"><code>POMDPs.stateindex</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">stateindex(problem::POMDP, s)
-stateindex(problem::MDP, s)</code></pre><p>Return the integer index of state <code>s</code>. Used for discrete models only.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L122-L127">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.actionindex" href="#POMDPs.actionindex"><code>POMDPs.actionindex</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">actionindex(problem::POMDP, a)
-actionindex(problem::MDP, a)</code></pre><p>Return the integer index of action <code>a</code>. Used for discrete models only.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L130-L135">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.obsindex" href="#POMDPs.obsindex"><code>POMDPs.obsindex</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">obsindex(problem::POMDP, o)</code></pre><p>Return the integer index of observation <code>o</code>. Used for discrete models only.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L138-L142">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.convert_s" href="#POMDPs.convert_s"><code>POMDPs.convert_s</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">convert_s(::Type{V}, s, problem::Union{MDP,POMDP}) where V&lt;:AbstractArray
-convert_s(::Type{S}, vec::V, problem::Union{MDP,POMDP}) where {S,V&lt;:AbstractArray}</code></pre><p>Convert a state to vectorized form or vice versa.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L145-L150">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.convert_a" href="#POMDPs.convert_a"><code>POMDPs.convert_a</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">convert_a(::Type{V}, a, problem::Union{MDP,POMDP}) where V&lt;:AbstractArray
-convert_a(::Type{A}, vec::V, problem::Union{MDP,POMDP}) where {A,V&lt;:AbstractArray}</code></pre><p>Convert an action to vectorized form or vice versa.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L162-L167">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.convert_o" href="#POMDPs.convert_o"><code>POMDPs.convert_o</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">convert_o(::Type{V}, o, problem::Union{MDP,POMDP}) where V&lt;:AbstractArray
-convert_o(::Type{O}, vec::V, problem::Union{MDP,POMDP}) where {O,V&lt;:AbstractArray}</code></pre><p>Convert an observation to vectorized form or vice versa.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/pomdp.jl#L179-L184">source</a></section></article><h3 id="Type-Inference"><a class="docs-heading-anchor" href="#Type-Inference">Type Inference</a><a id="Type-Inference-1"></a><a class="docs-heading-anchor-permalink" href="#Type-Inference" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.statetype" href="#POMDPs.statetype"><code>POMDPs.statetype</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">statetype(t::Type)
+POMDPs.gen(m::LQRMDP, s, a, rng) = (sp = s + a + randn(rng), r = -s^2 - a^2)</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/generative.jl#L1-L38">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.@gen" href="#POMDPs.@gen"><code>POMDPs.@gen</code></a> — <span class="docstring-category">Macro</span></header><section><div><pre><code class="language-julia hljs">@gen(X)(m, s, a)
+@gen(X)(m, s, a, rng::AbstractRNG)</code></pre><p>Call the generative model for a (PO)MDP <code>m</code>; sample values from several nodes in the dynamic decision network. X is one or more symbols indicating which nodes to output.</p><p>Solvers and simulators should call this rather than the <code>gen</code> function. Problem writers should implement a method of the <code>transition</code> or <code>gen</code> function instead of altering <code>@gen</code>.</p><p><strong>Arguments</strong></p><ul><li><code>m</code>: an <code>MDP</code> or <code>POMDP</code> model</li><li><code>s</code>: the current state</li><li><code>a</code>: the action</li><li><code>rng</code> (optional): a random number generator (typically a <code>MersenneTwister</code>)</li></ul><p><strong>Return</strong></p><p>If <code>X</code> is a symbol, return a value sampled from the corresponding node. If <code>X</code> is several symbols, return a <code>Tuple</code> of values sampled from the specified nodes.</p><p><strong>Examples</strong></p><p>Let <code>m</code> be an <code>MDP</code> or <code>POMDP</code>, <code>s</code> be a state of <code>m</code>, <code>a</code> be an action of <code>m</code>, and <code>rng</code> be an <code>AbstractRNG</code>.</p><ul><li><code>@gen(:sp, :r)(m, s, a)</code> returns a <code>Tuple</code> containing the next state and reward.</li><li><code>@gen(:sp, :o, :r)(m, s, a, rng)</code> returns a <code>Tuple</code> containing the next state, observation, and reward.</li><li><code>@gen(:sp)(m, s, a, rng)</code> returns the next state.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/generative.jl#L41-L63">source</a></section></article><h3 id="Static-Properties"><a class="docs-heading-anchor" href="#Static-Properties">Static Properties</a><a id="Static-Properties-1"></a><a class="docs-heading-anchor-permalink" href="#Static-Properties" title="Permalink"></a></h3><article 
class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.states" href="#POMDPs.states"><code>POMDPs.states</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">states(problem::POMDP)
+states(problem::MDP)</code></pre><p>Returns the complete state space of a POMDP. </p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/space.jl#L5-L10">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.actions" href="#POMDPs.actions"><code>POMDPs.actions</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">actions(m::Union{MDP,POMDP})</code></pre><p>Returns the entire action space of a (PO)MDP.</p><hr/><pre><code class="nohighlight hljs">actions(m::Union{MDP,POMDP}, s)</code></pre><p>Return the actions that can be taken from state <code>s</code>.</p><hr/><pre><code class="nohighlight hljs">actions(m::POMDP, b)</code></pre><p>Return the actions that can be taken from belief <code>b</code>.</p><p>To implement an observation-dependent action space, use <code>currentobs(b)</code> to get the observation associated with belief <code>b</code> within the implementation of <code>actions(m, b)</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/space.jl#L13-L29">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.observations" href="#POMDPs.observations"><code>POMDPs.observations</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">observations(problem::POMDP)</code></pre><p>Return the entire observation space.</p></div><a class="docs-sourcelink" target="_blank" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/space.jl#L35-L39">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.isterminal" href="#POMDPs.isterminal"><code>POMDPs.isterminal</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">isterminal(m::Union{MDP,POMDP}, s)</code></pre><p>Check if state <code>s</code> is terminal.</p><p>If a state is terminal, no actions will be taken in it and no additional rewards will be accumulated. Thus, the value function at such a state is, by definition, zero.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L92-L98">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.discount" href="#POMDPs.discount"><code>POMDPs.discount</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">discount(m::POMDP)
+discount(m::MDP)</code></pre><p>Return the discount factor for the problem.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L23-L28">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.initialstate" href="#POMDPs.initialstate"><code>POMDPs.initialstate</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">initialstate(m::Union{POMDP,MDP})</code></pre><p>Return a distribution of initial states for (PO)MDP <code>m</code>.</p><p>If it is difficult to define the probability density or mass function explicitly, consider using <code>POMDPModelTools.ImplicitDistribution</code> to define a model for sampling.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L101-L107">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.initialobs" href="#POMDPs.initialobs"><code>POMDPs.initialobs</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">initialobs(m::POMDP, s)</code></pre><p>Return a distribution of initial observations for POMDP <code>m</code> and state <code>s</code>.</p><p>If it is difficult to define the probability density or mass function explicitly, consider using <code>POMDPModelTools.ImplicitDistribution</code> to define a model for sampling.</p><p>This function is only used in cases where the policy expects an initial observation rather than an initial belief, e.g. 
in a reinforcement learning setting. It is not used in a standard POMDP simulation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L110-L118">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.stateindex" href="#POMDPs.stateindex"><code>POMDPs.stateindex</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">stateindex(problem::POMDP, s)
+stateindex(problem::MDP, s)</code></pre><p>Return the integer index of state <code>s</code>. Used for discrete models only.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L122-L127">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.actionindex" href="#POMDPs.actionindex"><code>POMDPs.actionindex</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">actionindex(problem::POMDP, a)
+actionindex(problem::MDP, a)</code></pre><p>Return the integer index of action <code>a</code>. Used for discrete models only.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L130-L135">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.obsindex" href="#POMDPs.obsindex"><code>POMDPs.obsindex</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">obsindex(problem::POMDP, o)</code></pre><p>Return the integer index of observation <code>o</code>. Used for discrete models only.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L138-L142">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.convert_s" href="#POMDPs.convert_s"><code>POMDPs.convert_s</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">convert_s(::Type{V}, s, problem::Union{MDP,POMDP}) where V&lt;:AbstractArray
+convert_s(::Type{S}, vec::V, problem::Union{MDP,POMDP}) where {S,V&lt;:AbstractArray}</code></pre><p>Convert a state to vectorized form or vice versa.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L145-L150">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.convert_a" href="#POMDPs.convert_a"><code>POMDPs.convert_a</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">convert_a(::Type{V}, a, problem::Union{MDP,POMDP}) where V&lt;:AbstractArray
+convert_a(::Type{A}, vec::V, problem::Union{MDP,POMDP}) where {A,V&lt;:AbstractArray}</code></pre><p>Convert an action to vectorized form or vice versa.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L162-L167">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.convert_o" href="#POMDPs.convert_o"><code>POMDPs.convert_o</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">convert_o(::Type{V}, o, problem::Union{MDP,POMDP}) where V&lt;:AbstractArray
+convert_o(::Type{O}, vec::V, problem::Union{MDP,POMDP}) where {O,V&lt;:AbstractArray}</code></pre><p>Convert an observation to vectorized form or vice versa.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/pomdp.jl#L179-L184">source</a></section></article><h3 id="Type-Inference"><a class="docs-heading-anchor" href="#Type-Inference">Type Inference</a><a id="Type-Inference-1"></a><a class="docs-heading-anchor-permalink" href="#Type-Inference" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.statetype" href="#POMDPs.statetype"><code>POMDPs.statetype</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">statetype(t::Type)
 statetype(p::Union{POMDP,MDP})</code></pre><p>Return the state type for a problem type (the <code>S</code> in <code>POMDP{S,A,O}</code>).</p><pre><code class="nohighlight hljs">type A &lt;: POMDP{Int, Bool, Bool} end
 
-statetype(A) # returns Int</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/type_inferrence.jl#L2-L13">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.actiontype" href="#POMDPs.actiontype"><code>POMDPs.actiontype</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">actiontype(t::Type)
+statetype(A) # returns Int</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/type_inferrence.jl#L2-L13">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.actiontype" href="#POMDPs.actiontype"><code>POMDPs.actiontype</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">actiontype(t::Type)
 actiontype(p::Union{POMDP,MDP})</code></pre><p>Return the state type for a problem type (the <code>S</code> in <code>POMDP{S,A,O}</code>).</p><pre><code class="nohighlight hljs">type A &lt;: POMDP{Bool, Int, Bool} end
 
-actiontype(A) # returns Int</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/type_inferrence.jl#L20-L31">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.obstype" href="#POMDPs.obstype"><code>POMDPs.obstype</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">obstype(t::Type)</code></pre><p>Return the state type for a problem type (the <code>S</code> in <code>POMDP{S,A,O}</code>).</p><pre><code class="nohighlight hljs">type A &lt;: POMDP{Bool, Bool, Int} end
+actiontype(A) # returns Int</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/type_inferrence.jl#L20-L31">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.obstype" href="#POMDPs.obstype"><code>POMDPs.obstype</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">obstype(t::Type)</code></pre><p>Return the observation type for a problem type (the <code>O</code> in <code>POMDP{S,A,O}</code>).</p><pre><code class="nohighlight hljs">type A &lt;: POMDP{Bool, Bool, Int} end
 
-obstype(A) # returns Int</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/type_inferrence.jl#L38-L48">source</a></section></article><h3 id="Distributions-and-Spaces"><a class="docs-heading-anchor" href="#Distributions-and-Spaces">Distributions and Spaces</a><a id="Distributions-and-Spaces-1"></a><a class="docs-heading-anchor-permalink" href="#Distributions-and-Spaces" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.rand" href="#Base.rand"><code>Base.rand</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">rand(rng::AbstractRNG, d::Any)</code></pre><p>Return a random element from distribution or space <code>d</code>.</p><p>If <code>d</code> is a state or transition distribution, the sample will be a state; if <code>d</code> is an action distribution, the sample will be an action or if <code>d</code> is an observation distribution, the sample will be an observation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/distribution.jl#L5-L11">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Distributions.pdf" href="#Distributions.pdf"><code>Distributions.pdf</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">pdf(d::Any, x::Any)</code></pre><p>Evaluate the probability density of distribution <code>d</code> at sample <code>x</code>.</p></div><a class="docs-sourcelink" target="_blank" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/distribution.jl#L14-L18">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="StatsBase.mode" href="#StatsBase.mode"><code>StatsBase.mode</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">mode(d::Any)</code></pre><p>Return the most likely value in a distribution d.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/distribution.jl#L21-L25">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Statistics.mean" href="#Statistics.mean"><code>Statistics.mean</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">mean(d::Any)</code></pre><p>Return the mean of a distribution d.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/distribution.jl#L28-L32">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Distributions.support" href="#Distributions.support"><code>Distributions.support</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">support(d::Any)</code></pre><p>Return an iterable object containing the possible values that can be sampled from distribution d. 
Values with zero probability may be skipped.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/distribution.jl#L35-L39">source</a></section></article><h2 id="Belief-Functions"><a class="docs-heading-anchor" href="#Belief-Functions">Belief Functions</a><a id="Belief-Functions-1"></a><a class="docs-heading-anchor-permalink" href="#Belief-Functions" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.update" href="#POMDPs.update"><code>POMDPs.update</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">update(updater::Updater, belief_old, action, observation)</code></pre><p>Return a new instance of an updated belief given <code>belief_old</code> and the latest action and observation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/belief.jl#L17-L21">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.initialize_belief" href="#POMDPs.initialize_belief"><code>POMDPs.initialize_belief</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">initialize_belief(updater::Updater,
+obstype(A) # returns Int</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/type_inferrence.jl#L38-L48">source</a></section></article><h3 id="Distributions-and-Spaces"><a class="docs-heading-anchor" href="#Distributions-and-Spaces">Distributions and Spaces</a><a id="Distributions-and-Spaces-1"></a><a class="docs-heading-anchor-permalink" href="#Distributions-and-Spaces" title="Permalink"></a></h3><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.rand" href="#Base.rand"><code>Base.rand</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">rand(rng::AbstractRNG, d::Any)</code></pre><p>Return a random element from distribution or space <code>d</code>.</p><p>If <code>d</code> is a state or transition distribution, the sample will be a state; if <code>d</code> is an action distribution, the sample will be an action or if <code>d</code> is an observation distribution, the sample will be an observation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/distribution.jl#L5-L11">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Distributions.pdf" href="#Distributions.pdf"><code>Distributions.pdf</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">pdf(d::Any, x::Any)</code></pre><p>Evaluate the probability density of distribution <code>d</code> at sample <code>x</code>.</p></div><a class="docs-sourcelink" target="_blank" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/distribution.jl#L14-L18">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="StatsBase.mode" href="#StatsBase.mode"><code>StatsBase.mode</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">mode(d::Any)</code></pre><p>Return the most likely value in a distribution d.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/distribution.jl#L21-L25">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Statistics.mean" href="#Statistics.mean"><code>Statistics.mean</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">mean(d::Any)</code></pre><p>Return the mean of a distribution d.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/distribution.jl#L28-L32">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Distributions.support" href="#Distributions.support"><code>Distributions.support</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">support(d::Any)</code></pre><p>Return an iterable object containing the possible values that can be sampled from distribution d. 
Values with zero probability may be skipped.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/distribution.jl#L35-L39">source</a></section></article><h2 id="Belief-Functions"><a class="docs-heading-anchor" href="#Belief-Functions">Belief Functions</a><a id="Belief-Functions-1"></a><a class="docs-heading-anchor-permalink" href="#Belief-Functions" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.update" href="#POMDPs.update"><code>POMDPs.update</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">update(updater::Updater, belief_old, action, observation)</code></pre><p>Return a new instance of an updated belief given <code>belief_old</code> and the latest action and observation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/belief.jl#L17-L21">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.initialize_belief" href="#POMDPs.initialize_belief"><code>POMDPs.initialize_belief</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">initialize_belief(updater::Updater,
                      state_distribution::Any)
-initialize_belief(updater::Updater, belief::Any)</code></pre><p>Returns a belief that can be updated using <code>updater</code> that has similar distribution to <code>state_distribution</code> or <code>belief</code>.</p><p>The conversion may be lossy. This function is also idempotent, i.e. there is a default implementation that passes the belief through when it is already the correct type: <code>initialize_belief(updater::Updater, belief) = belief</code></p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/belief.jl#L24-L35">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.history" href="#POMDPs.history"><code>POMDPs.history</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">history(b)</code></pre><p>Return the action-observation history associated with belief <code>b</code>.</p><p>The history should be an <code>AbstractVector</code>, <code>Tuple</code>, (or similar object that supports indexing with <code>end</code>) full of <code>NamedTuples</code> with keys <code>:a</code> and <code>:o</code>, i.e. <code>history(b)[end][:a]</code> should be the last action taken leading up to <code>b</code>, and <code>history(b)[end][:o]</code> should be the last observation received.</p><p>It is acceptable to return only part of the history if that is all that is available, but it should always end with the current observation. 
For example, it would be acceptable to return a structure containing only the last three observations in a length 3 <code>Vector{NamedTuple{(:o,),Tuple{O}}</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/belief.jl#L41-L49">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.currentobs" href="#POMDPs.currentobs"><code>POMDPs.currentobs</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">currentobs(b)</code></pre><p>Return the latest observation associated with belief <code>b</code>.</p><p>If a solver or updater implements <code>history(b)</code> for a belief type, <code>currentobs</code> has a default implementation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/belief.jl#L52-L58">source</a></section></article><h2 id="Policy-and-Solver-Functions"><a class="docs-heading-anchor" href="#Policy-and-Solver-Functions">Policy and Solver Functions</a><a id="Policy-and-Solver-Functions-1"></a><a class="docs-heading-anchor-permalink" href="#Policy-and-Solver-Functions" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.solve" href="#POMDPs.solve"><code>POMDPs.solve</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">solve(solver::Solver, problem::POMDP)</code></pre><p>Solves the POMDP using method associated with solver, and returns a policy.</p></div><a class="docs-sourcelink" target="_blank" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/solver.jl#L7-L11">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.updater" href="#POMDPs.updater"><code>POMDPs.updater</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">updater(policy::Policy)</code></pre><p>Returns a default Updater appropriate for a belief type that policy <code>p</code> can use</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/policy.jl#L21-L25">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.action" href="#POMDPs.action"><code>POMDPs.action</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">action(policy::Policy, x)</code></pre><p>Returns the action that the policy deems best for the current state or belief, <code>x</code>.</p><p><code>x</code> is a generalized information state - can be a state in an MDP, a distribution in POMDP, or another specialized policy-dependent representation of the information needed to choose an action.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/policy.jl#L12-L18">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.value" 
href="#POMDPs.value"><code>POMDPs.value</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">value(p::Policy, s)
-value(p::Policy, s, a)</code></pre><p>Returns the utility value from policy <code>p</code> given the state (or belief), or state-action (or belief-action) pair.</p><p>The state-action version is commonly referred to as the Q-value.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/policy.jl#L28-L35">source</a></section></article><h2 id="Simulator"><a class="docs-heading-anchor" href="#Simulator">Simulator</a><a id="Simulator-1"></a><a class="docs-heading-anchor-permalink" href="#Simulator" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.Simulator" href="#POMDPs.Simulator"><code>POMDPs.Simulator</code></a> — <span class="docstring-category">Type</span></header><section><div><p>Base type for an object defining how simulations should be carried out.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/simulator.jl#L1-L3">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.simulate" href="#POMDPs.simulate"><code>POMDPs.simulate</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">simulate(sim::Simulator, m::POMDP, p::Policy, u::Updater=updater(p), b0=initialstate(m), s0=rand(b0))
-simulate(sim::Simulator, m::MDP, p::Policy, s0=rand(initialstate(m)))</code></pre><p>Run a simulation using the specified policy.</p><p>The return type is flexible and depends on the simulator. Simulations should adhere to the <a href="https://juliapomdp.github.io/POMDPs.jl/stable/simulation/#Simulation-Standard">Simulation Standard</a>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6113ea4c6131aed9943cf1ecb5d65360f2cd47fe/src/simulator.jl#L6-L13">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../faq/">« Frequently Asked Questions (FAQ)</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+initialize_belief(updater::Updater, belief::Any)</code></pre><p>Returns a belief that can be updated using <code>updater</code> that has similar distribution to <code>state_distribution</code> or <code>belief</code>.</p><p>The conversion may be lossy. This function is also idempotent, i.e. there is a default implementation that passes the belief through when it is already the correct type: <code>initialize_belief(updater::Updater, belief) = belief</code></p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/belief.jl#L24-L35">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.history" href="#POMDPs.history"><code>POMDPs.history</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">history(b)</code></pre><p>Return the action-observation history associated with belief <code>b</code>.</p><p>The history should be an <code>AbstractVector</code>, <code>Tuple</code>, (or similar object that supports indexing with <code>end</code>) full of <code>NamedTuples</code> with keys <code>:a</code> and <code>:o</code>, i.e. <code>history(b)[end][:a]</code> should be the last action taken leading up to <code>b</code>, and <code>history(b)[end][:o]</code> should be the last observation received.</p><p>It is acceptable to return only part of the history if that is all that is available, but it should always end with the current observation. 
For example, it would be acceptable to return a structure containing only the last three observations in a length 3 <code>Vector{NamedTuple{(:o,),Tuple{O}}</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/belief.jl#L41-L49">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.currentobs" href="#POMDPs.currentobs"><code>POMDPs.currentobs</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">currentobs(b)</code></pre><p>Return the latest observation associated with belief <code>b</code>.</p><p>If a solver or updater implements <code>history(b)</code> for a belief type, <code>currentobs</code> has a default implementation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/belief.jl#L52-L58">source</a></section></article><h2 id="Policy-and-Solver-Functions"><a class="docs-heading-anchor" href="#Policy-and-Solver-Functions">Policy and Solver Functions</a><a id="Policy-and-Solver-Functions-1"></a><a class="docs-heading-anchor-permalink" href="#Policy-and-Solver-Functions" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.solve" href="#POMDPs.solve"><code>POMDPs.solve</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">solve(solver::Solver, problem::POMDP)</code></pre><p>Solves the POMDP using method associated with solver, and returns a policy.</p></div><a class="docs-sourcelink" target="_blank" 
href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/solver.jl#L7-L11">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.updater" href="#POMDPs.updater"><code>POMDPs.updater</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">updater(policy::Policy)</code></pre><p>Returns a default Updater appropriate for a belief type that policy <code>p</code> can use</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/policy.jl#L21-L25">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.action" href="#POMDPs.action"><code>POMDPs.action</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">action(policy::Policy, x)</code></pre><p>Returns the action that the policy deems best for the current state or belief, <code>x</code>.</p><p><code>x</code> is a generalized information state - can be a state in an MDP, a distribution in POMDP, or another specialized policy-dependent representation of the information needed to choose an action.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/policy.jl#L12-L18">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.value" 
href="#POMDPs.value"><code>POMDPs.value</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">value(p::Policy, s)
+value(p::Policy, s, a)</code></pre><p>Returns the utility value from policy <code>p</code> given the state (or belief), or state-action (or belief-action) pair.</p><p>The state-action version is commonly referred to as the Q-value.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/policy.jl#L28-L35">source</a></section></article><h2 id="Simulator"><a class="docs-heading-anchor" href="#Simulator">Simulator</a><a id="Simulator-1"></a><a class="docs-heading-anchor-permalink" href="#Simulator" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.Simulator" href="#POMDPs.Simulator"><code>POMDPs.Simulator</code></a> — <span class="docstring-category">Type</span></header><section><div><p>Base type for an object defining how simulations should be carried out.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/simulator.jl#L1-L3">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="POMDPs.simulate" href="#POMDPs.simulate"><code>POMDPs.simulate</code></a> — <span class="docstring-category">Function</span></header><section><div><pre><code class="language-julia hljs">simulate(sim::Simulator, m::POMDP, p::Policy, u::Updater=updater(p), b0=initialstate(m), s0=rand(b0))
+simulate(sim::Simulator, m::MDP, p::Policy, s0=rand(initialstate(m)))</code></pre><p>Run a simulation using the specified policy.</p><p>The return type is flexible and depends on the simulator. Simulations should adhere to the <a href="https://juliapomdp.github.io/POMDPs.jl/stable/simulation/#Simulation-Standard">Simulation Standard</a>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/6ffa5648b2288d02e3c3086647aa150168a31d3d/src/simulator.jl#L6-L13">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../faq/">« Frequently Asked Questions (FAQ)</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/concepts/index.html b/dev/concepts/index.html
index 4282e097..81a06874 100644
--- a/dev/concepts/index.html
+++ b/dev/concepts/index.html
@@ -1,2 +1,2 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Concepts and Architecture · POMDPs.jl</title><meta name="title" content="Concepts and Architecture · POMDPs.jl"/><meta property="og:title" content="Concepts and Architecture · POMDPs.jl"/><meta property="twitter:title" content="Concepts and Architecture · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link 
class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li class="is-active"><a class="tocitem" href>Concepts and Architecture</a><ul class="internal"><li><a class="tocitem" href="#POMDPs-and-MDPs"><span>POMDPs and MDPs</span></a></li><li><a class="tocitem" href="#Beliefs-and-Updaters"><span>Beliefs and Updaters</span></a></li><li><a class="tocitem" href="#Solvers-and-Policies"><span>Solvers and Policies</span></a></li><li><a class="tocitem" href="#Simulators"><span>Simulators</span></a></li></ul></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and 
Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a 
class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Basics</a></li><li class="is-active"><a href>Concepts and Architecture</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Concepts and Architecture</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/concepts.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Concepts-and-Architecture"><a class="docs-heading-anchor" href="#Concepts-and-Architecture">Concepts and Architecture</a><a 
id="Concepts-and-Architecture-1"></a><a class="docs-heading-anchor-permalink" href="#Concepts-and-Architecture" title="Permalink"></a></h1><p>POMDPs.jl aims to coordinate the development of three software components: 1) a problem, 2) a solver, 3) an experiment. Each of these components has a set of abstract types associated with it and a set of functions that allow a user to define each component&#39;s behavior in a standardized way. An outline of the architecture is shown below.</p><p><img src="../figures/concepts.png" alt="concepts"/></p><p>The MDP and POMDP types are associated with the problem definition. The Solver and Policy types are associated with the solver or decision-making agent. Typically, the Updater type is also associated with the solver, but a solver may sometimes be used with an updater that was implemented separately. The Simulator type is associated with the experiment.</p><p>The code components of the POMDPs.jl ecosystem relevant to problems and solvers are shown below. The arrows represent the flow of information from the problems to the solvers. The figure shows the two interfaces that form POMDPs.jl - Explicit and Generative. Details about these interfaces can be found in the section on <a href="../def_pomdp/#defining_pomdps">Defining POMDPs</a>.</p><p><img src="../figures/interface_relationships.svg" alt="interface_relationships"/></p><h2 id="POMDPs-and-MDPs"><a class="docs-heading-anchor" href="#POMDPs-and-MDPs">POMDPs and MDPs</a><a id="POMDPs-and-MDPs-1"></a><a class="docs-heading-anchor-permalink" href="#POMDPs-and-MDPs" title="Permalink"></a></h2><p>An MDP is a mathematical framework for sequential decision making under uncertainty, and where all of the uncertainty arises from outcomes that are partially random and partially under the control of a decision maker. 
Mathematically, an MDP is a tuple <span>$(S,A,T,R,\gamma)$</span>, where <span>$S$</span> is the state space, <span>$A$</span> is the action space, <span>$T$</span> is a transition function defining the probability of transitioning to each state given the state and action at the previous time, and <span>$R$</span> is a reward function mapping every possible transition <span>$(s,a,s&#39;)$</span> to a real reward value. Finally, <span>$\gamma$</span> is a discount factor that defines the relative weighting of current and future rewards. For more information see a textbook such as [1]. In POMDPs.jl an MDP is represented by a concrete subtype of the <a href="../api/#POMDPs.MDP"><code>MDP</code></a> abstract type and a set of methods that define each of its components as described in the <a href="../def_pomdp/#defining_pomdps">problem definition section</a>.</p><p>A POMDP is a more general sequential decision making problem in which the agent is not sure what state they are in. The state is only partially observable by the decision making agent. Mathematically, a POMDP is a tuple <span>$(S,A,T,R,O,Z,\gamma)$</span> where <span>$S$</span>, <span>$A$</span>, <span>$T$</span>, <span>$R$</span>, and <span>$\gamma$</span> have the same meaning as in an MDP, <span>$O$</span> is the agent&#39;s observation space, and <span>$Z$</span> defines the probability of receiving each observation at a transition. In POMDPs.jl, a POMDP is represented by a concrete subtype of the <a href="../api/#POMDPs.POMDP"><code>POMDP</code></a> abstract type, and the methods described in the <a href="../def_pomdp/#defining_pomdps">problem definition section</a>.</p><p>POMDPs.jl contains additional functions for defining optional problem behavior such as an <a href="../def_pomdp/#Initial-state-distribution">initial state distribution</a> or <a href="../def_pomdp/#Terminal-states">terminal states</a>. 
More information can be found in the <a href="../def_pomdp/#defining_pomdps">Defining POMDPs</a> section.</p><h2 id="Beliefs-and-Updaters"><a class="docs-heading-anchor" href="#Beliefs-and-Updaters">Beliefs and Updaters</a><a id="Beliefs-and-Updaters-1"></a><a class="docs-heading-anchor-permalink" href="#Beliefs-and-Updaters" title="Permalink"></a></h2><p>In a POMDP domain, the decision-making agent does not have complete information about the state of the problem, so the agent can only make choices based on its &quot;belief&quot; about the state. In the POMDP literature, the term &quot;belief&quot; is typically defined to mean a probability distribution over all possible states of the system. However, in practice, the agent often makes decisions based on an incomplete or lossy record of past observations that has a structure much different from a probability distribution. For example, if the agent is represented by a finite-state controller, as is the case for Monte-Carlo Value Iteration [2], the belief is the controller state, which is a node in a graph. Another example is an agent represented by a recurrent neural network. In this case, the agent&#39;s belief is the state of the network. In order to accommodate a wide variety of decision-making approaches in POMDPs.jl, we use the term &quot;belief&quot; to denote the set of information that the agent makes a decision on, which could be an exact state distribution, an action-observation history, a set of weighted particles, or the examples mentioned before. In code, the belief can be represented by any built-in or user-defined type.</p><p>When an action is taken and a new observation is received, the belief is updated by the belief updater. 
In code, a belief updater is represented by a concrete subtype of the <a href="../api/#POMDPs.Updater"><code>Updater</code></a> abstract type, and the <a href="../api/#POMDPs.update"><code>update(updater, belief, action, observation)</code></a> function defines how the belief is updated when a new observation is received.</p><p>Although the agent may use a specialized belief structure to make decisions, the information initially given to the agent about the state of the problem is usually most conveniently represented as a state distribution, thus the <a href="../api/#POMDPs.initialize_belief"><code>initialize_belief</code></a> function is provided to convert a state distribution to a specialized belief structure that an updater can work with.</p><p>In many cases, the belief structure is closely related to the solution technique, so it will be implemented by the programmer who writes the solver. In other cases, the agent can use a variety of belief structures to make decisions, so a domain-specific updater implemented by the programmer that wrote the problem description may be appropriate. Finally, some advanced generic belief updaters such as particle filters may be implemented by a third party. The convenience function <a href="../api/#POMDPs.updater"><code>updater(policy)</code></a> can be used to get a suitable default updater for a policy, however many policies can work with other updaters.</p><p>For more information on implementing a belief updater, see <a href="../def_updater/#Defining-a-Belief-Updater">Defining a Belief Updater</a></p><h2 id="Solvers-and-Policies"><a class="docs-heading-anchor" href="#Solvers-and-Policies">Solvers and Policies</a><a id="Solvers-and-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Solvers-and-Policies" title="Permalink"></a></h2><p>Sequential decision making under uncertainty involves both online and offline calculations. 
In the broad sense, the term &quot;solver&quot; as used in the node in the figure at the top of the page refers to the software package that performs the calculations at both of these times. However, the code is broken up into two pieces, the solver that performs calculations offline and the policy that performs calculations online.</p><p>In the abstract, a policy is a mapping from every belief that an agent might take to an action. A policy is represented in code by a concrete subtype of the <a href="../api/#POMDPs.Policy"><code>Policy</code></a> abstract type. The programmer implements <a href="../api/#POMDPs.action"><code>action</code></a> to describe what computations need to be done online. For an online solver such as POMCP, all of the decision computation occurs within <a href="../api/#POMDPs.action"><code>action</code></a> while for an offline solver like SARSOP, there is very little computation within <a href="../api/#POMDPs.action"><code>action</code></a>. See <a href="../policy_interaction/#Interacting-with-Policies">Interacting with Policies</a> for more information.</p><p>The offline portion of the computation is carried out by the solver, which is represented by a concrete subtype of the <a href="../api/#POMDPs.Solver"><code>Solver</code></a> abstract type. Computations occur within the <a href="../api/#POMDPs.solve"><code>solve</code></a> function. For an offline solver like SARSOP, nearly all of the decision computation occurs within this function, but for some online solvers such as POMCP, <a href="../api/#POMDPs.solve"><code>solve</code></a> merely embeds the problem in the policy.</p><h2 id="Simulators"><a class="docs-heading-anchor" href="#Simulators">Simulators</a><a id="Simulators-1"></a><a class="docs-heading-anchor-permalink" href="#Simulators" title="Permalink"></a></h2><p>A simulator defines a way to run one or more simulations. 
It is represented by a concrete subtype of the <a href="../api/#Simulator"><code>Simulator</code></a> abstract type and the simulation is an implemention of <a href="../api/#POMDPs.simulate"><code>simulate</code></a>. Depending on the simulator, <a href="../api/#POMDPs.simulate"><code>simulate</code></a> may return a variety of data about the simulation, such as the discounted reward or the state history. All simulators should perform simulations consistent with the <a href="../simulation/#Simulation-Standard">Simulation Standard</a>.</p><p>[1] <em>Decision Making Under Uncertainty: Theory and Application</em> by Mykel J. Kochenderfer, MIT Press, 2015</p><p>[2] Bai, H., Hsu, D., &amp; Lee, W. S. (2014). Integrated perception and planning in the continuous space: A POMDP approach. The International Journal of Robotics Research, 33(9), 1288-1302</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../get_started/">« Getting Started</a><a class="docs-footer-nextpage" href="../def_pomdp/">Defining POMDPs and MDPs »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option 
value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Concepts and Architecture · POMDPs.jl</title><meta name="title" content="Concepts and Architecture · POMDPs.jl"/><meta property="og:title" content="Concepts and Architecture · POMDPs.jl"/><meta property="twitter:title" content="Concepts and Architecture · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link 
class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li class="is-active"><a class="tocitem" href>Concepts and Architecture</a><ul class="internal"><li><a class="tocitem" href="#POMDPs-and-MDPs"><span>POMDPs and MDPs</span></a></li><li><a class="tocitem" href="#Beliefs-and-Updaters"><span>Beliefs and Updaters</span></a></li><li><a class="tocitem" href="#Solvers-and-Policies"><span>Solvers and Policies</span></a></li><li><a class="tocitem" href="#Simulators"><span>Simulators</span></a></li></ul></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and 
Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a 
class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Basics</a></li><li class="is-active"><a href>Concepts and Architecture</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Concepts and Architecture</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/concepts.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Concepts-and-Architecture"><a class="docs-heading-anchor" href="#Concepts-and-Architecture">Concepts and Architecture</a><a 
id="Concepts-and-Architecture-1"></a><a class="docs-heading-anchor-permalink" href="#Concepts-and-Architecture" title="Permalink"></a></h1><p>POMDPs.jl aims to coordinate the development of three software components: 1) a problem, 2) a solver, 3) an experiment. Each of these components has a set of abstract types associated with it and a set of functions that allow a user to define each component&#39;s behavior in a standardized way. An outline of the architecture is shown below.</p><p><img src="../figures/concepts.png" alt="concepts"/></p><p>The MDP and POMDP types are associated with the problem definition. The Solver and Policy types are associated with the solver or decision-making agent. Typically, the Updater type is also associated with the solver, but a solver may sometimes be used with an updater that was implemented separately. The Simulator type is associated with the experiment.</p><p>The code components of the POMDPs.jl ecosystem relevant to problems and solvers are shown below. The arrows represent the flow of information from the problems to the solvers. The figure shows the two interfaces that form POMDPs.jl - Explicit and Generative. Details about these interfaces can be found in the section on <a href="../def_pomdp/#defining_pomdps">Defining POMDPs</a>.</p><p><img src="../figures/interface_relationships.svg" alt="interface_relationships"/></p><h2 id="POMDPs-and-MDPs"><a class="docs-heading-anchor" href="#POMDPs-and-MDPs">POMDPs and MDPs</a><a id="POMDPs-and-MDPs-1"></a><a class="docs-heading-anchor-permalink" href="#POMDPs-and-MDPs" title="Permalink"></a></h2><p>An MDP is a mathematical framework for sequential decision making under uncertainty, where all of the uncertainty arises from outcomes that are partially random and partially under the control of a decision maker. 
Mathematically, an MDP is a tuple <span>$(S,A,T,R,\gamma)$</span>, where <span>$S$</span> is the state space, <span>$A$</span> is the action space, <span>$T$</span> is a transition function defining the probability of transitioning to each state given the state and action at the previous time, and <span>$R$</span> is a reward function mapping every possible transition <span>$(s,a,s&#39;)$</span> to a real reward value. Finally, <span>$\gamma$</span> is a discount factor that defines the relative weighting of current and future rewards. For more information see a textbook such as [1]. In POMDPs.jl an MDP is represented by a concrete subtype of the <a href="../api/#POMDPs.MDP"><code>MDP</code></a> abstract type and a set of methods that define each of its components as described in the <a href="../def_pomdp/#defining_pomdps">problem definition section</a>.</p><p>A POMDP is a more general sequential decision making problem in which the agent is not sure what state they are in. The state is only partially observable by the decision making agent. Mathematically, a POMDP is a tuple <span>$(S,A,T,R,O,Z,\gamma)$</span> where <span>$S$</span>, <span>$A$</span>, <span>$T$</span>, <span>$R$</span>, and <span>$\gamma$</span> have the same meaning as in an MDP, <span>$O$</span> is the agent&#39;s observation space, and <span>$Z$</span> defines the probability of receiving each observation at a transition. In POMDPs.jl, a POMDP is represented by a concrete subtype of the <a href="../api/#POMDPs.POMDP"><code>POMDP</code></a> abstract type, and the methods described in the <a href="../def_pomdp/#defining_pomdps">problem definition section</a>.</p><p>POMDPs.jl contains additional functions for defining optional problem behavior such as an <a href="../def_pomdp/#Initial-state-distribution">initial state distribution</a> or <a href="../def_pomdp/#Terminal-states">terminal states</a>. 
More information can be found in the <a href="../def_pomdp/#defining_pomdps">Defining POMDPs</a> section.</p><h2 id="Beliefs-and-Updaters"><a class="docs-heading-anchor" href="#Beliefs-and-Updaters">Beliefs and Updaters</a><a id="Beliefs-and-Updaters-1"></a><a class="docs-heading-anchor-permalink" href="#Beliefs-and-Updaters" title="Permalink"></a></h2><p>In a POMDP domain, the decision-making agent does not have complete information about the state of the problem, so the agent can only make choices based on its &quot;belief&quot; about the state. In the POMDP literature, the term &quot;belief&quot; is typically defined to mean a probability distribution over all possible states of the system. However, in practice, the agent often makes decisions based on an incomplete or lossy record of past observations that has a structure much different from a probability distribution. For example, if the agent is represented by a finite-state controller, as is the case for Monte-Carlo Value Iteration [2], the belief is the controller state, which is a node in a graph. Another example is an agent represented by a recurrent neural network. In this case, the agent&#39;s belief is the state of the network. In order to accommodate a wide variety of decision-making approaches in POMDPs.jl, we use the term &quot;belief&quot; to denote the set of information that the agent makes a decision on, which could be an exact state distribution, an action-observation history, a set of weighted particles, or the examples mentioned before. In code, the belief can be represented by any built-in or user-defined type.</p><p>When an action is taken and a new observation is received, the belief is updated by the belief updater. 
In code, a belief updater is represented by a concrete subtype of the <a href="../api/#POMDPs.Updater"><code>Updater</code></a> abstract type, and the <a href="../api/#POMDPs.update"><code>update(updater, belief, action, observation)</code></a> function defines how the belief is updated when a new observation is received.</p><p>Although the agent may use a specialized belief structure to make decisions, the information initially given to the agent about the state of the problem is usually most conveniently represented as a state distribution; thus, the <a href="../api/#POMDPs.initialize_belief"><code>initialize_belief</code></a> function is provided to convert a state distribution to a specialized belief structure that an updater can work with.</p><p>In many cases, the belief structure is closely related to the solution technique, so it will be implemented by the programmer who writes the solver. In other cases, the agent can use a variety of belief structures to make decisions, so a domain-specific updater implemented by the programmer that wrote the problem description may be appropriate. Finally, some advanced generic belief updaters such as particle filters may be implemented by a third party. The convenience function <a href="../api/#POMDPs.updater"><code>updater(policy)</code></a> can be used to get a suitable default updater for a policy; however, many policies can work with other updaters.</p><p>For more information on implementing a belief updater, see <a href="../def_updater/#Defining-a-Belief-Updater">Defining a Belief Updater</a>.</p><h2 id="Solvers-and-Policies"><a class="docs-heading-anchor" href="#Solvers-and-Policies">Solvers and Policies</a><a id="Solvers-and-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Solvers-and-Policies" title="Permalink"></a></h2><p>Sequential decision making under uncertainty involves both online and offline calculations. 
In the broad sense, the term &quot;solver&quot; as used in the node in the figure at the top of the page refers to the software package that performs the calculations at both of these times. However, the code is broken up into two pieces, the solver that performs calculations offline and the policy that performs calculations online.</p><p>In the abstract, a policy is a mapping from every belief that an agent might take to an action. A policy is represented in code by a concrete subtype of the <a href="../api/#POMDPs.Policy"><code>Policy</code></a> abstract type. The programmer implements <a href="../api/#POMDPs.action"><code>action</code></a> to describe what computations need to be done online. For an online solver such as POMCP, all of the decision computation occurs within <a href="../api/#POMDPs.action"><code>action</code></a> while for an offline solver like SARSOP, there is very little computation within <a href="../api/#POMDPs.action"><code>action</code></a>. See <a href="../policy_interaction/#Interacting-with-Policies">Interacting with Policies</a> for more information.</p><p>The offline portion of the computation is carried out by the solver, which is represented by a concrete subtype of the <a href="../api/#POMDPs.Solver"><code>Solver</code></a> abstract type. Computations occur within the <a href="../api/#POMDPs.solve"><code>solve</code></a> function. For an offline solver like SARSOP, nearly all of the decision computation occurs within this function, but for some online solvers such as POMCP, <a href="../api/#POMDPs.solve"><code>solve</code></a> merely embeds the problem in the policy.</p><h2 id="Simulators"><a class="docs-heading-anchor" href="#Simulators">Simulators</a><a id="Simulators-1"></a><a class="docs-heading-anchor-permalink" href="#Simulators" title="Permalink"></a></h2><p>A simulator defines a way to run one or more simulations. 
It is represented by a concrete subtype of the <a href="../api/#Simulator"><code>Simulator</code></a> abstract type and the simulation is an implementation of <a href="../api/#POMDPs.simulate"><code>simulate</code></a>. Depending on the simulator, <a href="../api/#POMDPs.simulate"><code>simulate</code></a> may return a variety of data about the simulation, such as the discounted reward or the state history. All simulators should perform simulations consistent with the <a href="../simulation/#Simulation-Standard">Simulation Standard</a>.</p><p>[1] <em>Decision Making Under Uncertainty: Theory and Application</em> by Mykel J. Kochenderfer, MIT Press, 2015</p><p>[2] Bai, H., Hsu, D., &amp; Lee, W. S. (2014). Integrated perception and planning in the continuous space: A POMDP approach. The International Journal of Robotics Research, 33(9), 1288-1302</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../get_started/">« Getting Started</a><a class="docs-footer-nextpage" href="../def_pomdp/">Defining POMDPs and MDPs »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option 
value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/def_pomdp/index.html b/dev/def_pomdp/index.html
index 025a17fa..ced9a70b 100644
--- a/dev/def_pomdp/index.html
+++ b/dev/def_pomdp/index.html
@@ -196,4 +196,4 @@
 R = [-1. -100. 10.; 
      -1. 10. -100.]
 
-m = TabularPOMDP(T, R, O, 0.95)</code></pre><p>Here <code>T</code> is a <span>$|S| \times |A| \times |S|$</span> array representing the transition probabilities, with <code>T[sp, a, s]</code> <span>$= T(s&#39; | s, a)$</span>. Similarly, <code>O</code> is an <span>$|O| \times |A| \times |S|$</span> encoding the observation distribution with <code>O[o, a, sp]</code> <span>$= Z(o | a, s&#39;)$</span>, and <code>R</code> is a <span>$|S| \times |A|$</span> matrix that encodes the reward function. 0.95 is the discount factor.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../concepts/">« Concepts and Architecture</a><a class="docs-footer-nextpage" href="../interfaces/">Spaces and Distributions »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. 
Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+m = TabularPOMDP(T, R, O, 0.95)</code></pre><p>Here <code>T</code> is a <span>$|S| \times |A| \times |S|$</span> array representing the transition probabilities, with <code>T[sp, a, s]</code> <span>$= T(s&#39; | s, a)$</span>. Similarly, <code>O</code> is an <span>$|O| \times |A| \times |S|$</span> array encoding the observation distribution with <code>O[o, a, sp]</code> <span>$= Z(o | a, s&#39;)$</span>, and <code>R</code> is a <span>$|S| \times |A|$</span> matrix that encodes the reward function. 0.95 is the discount factor.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../concepts/">« Concepts and Architecture</a><a class="docs-footer-nextpage" href="../interfaces/">Spaces and Distributions »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. 
Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/def_solver/index.html b/dev/def_solver/index.html
index 91575a93..4d0c36c6 100644
--- a/dev/def_solver/index.html
+++ b/dev/def_solver/index.html
@@ -1,2 +1,2 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Solvers · POMDPs.jl</title><meta name="title" content="Solvers · POMDPs.jl"/><meta property="og:title" content="Solvers · POMDPs.jl"/><meta property="twitter:title" content="Solvers · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li class="is-active"><a class="tocitem" href>Solvers</a><ul class="internal"><li><a class="tocitem" href="#Online-and-Offline-Solvers"><span>Online and Offline Solvers</span></a></li><li><a class="tocitem" href="#Examples"><span>Examples</span></a></li></ul></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" 
href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" 
href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Writing Solvers</a></li><li class="is-active"><a href>Solvers</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Solvers</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/def_solver.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Solvers"><a class="docs-heading-anchor" href="#Solvers">Solvers</a><a id="Solvers-1"></a><a class="docs-heading-anchor-permalink" href="#Solvers" title="Permalink"></a></h1><p>Defining a solver involves creating or using four pieces of code:</p><ol><li>A subtype of <a href="../api/#POMDPs.Solver"><code>Solver</code></a> that holds the parameters and configuration options for the solver.</li><li>A subtype of <a 
href="../api/#POMDPs.Policy"><code>Policy</code></a> that holds all of the data needed to choose actions online.</li><li>A method of <a href="../api/#POMDPs.solve"><code>solve</code></a> that takes the <code>Solver</code> and a (PO)MDP as arguments, performs all of the <em>offline</em> computations for solving the problem, and returns the policy.</li><li>A method of <a href="../api/#POMDPs.action"><code>action</code></a> that takes in the policy and a state or belief and returns an action.</li></ol><p>In many cases, items 2 and 4 can be satisfied with an off-the-shelf <code>Policy</code> from the <a href="../POMDPTools/#pomdptools_section">POMDPTools package</a>. also contains many tools that are useful for defining solvers in a robust, concise, and readable manner.</p><h2 id="Online-and-Offline-Solvers"><a class="docs-heading-anchor" href="#Online-and-Offline-Solvers">Online and Offline Solvers</a><a id="Online-and-Offline-Solvers-1"></a><a class="docs-heading-anchor-permalink" href="#Online-and-Offline-Solvers" title="Permalink"></a></h2><p>Generally, solvers can be grouped into two categories: <em>Offline</em> solvers that do most of their computational work <em>before</em> interacting with the environment, and <em>online</em> solvers that do their work online as each new state or observation is encountered. 
Although offline and online solvers both use the exact same <a href="../api/#POMDPs.Solver"><code>Solver</code></a>, <a href="../api/#POMDPs.solve"><code>solve</code></a>, <a href="../api/#POMDPs.Policy"><code>Policy</code></a>, <a href="../api/#POMDPs.action"><code>action</code></a> structure, the work of defining online and offline solvers is focused on different portions.</p><p>For an offline solver, most of the implementation effort will be spent on the [<code>solve</code>] function, and an off-the-shelf policy from <a href="../POMDPTools/#pomdptools_section">POMDPTools</a> will typically be used.</p><p>For an online solver, the <a href="../api/#POMDPs.solve"><code>solve</code></a> function typically does little or no work, but merely creates a <code>Policy</code> object that will carry out computation online. It is typical in POMDPs.jl to use the term &quot;Planner&quot; to name a <a href="../api/#POMDPs.Policy"><code>Policy</code></a> object for an online solver that carries out a large amount of computation (&quot;planning&quot;) at interaction time. In this case most of the effort will be focused on implementing the <a href="../api/#POMDPs.action"><code>action</code></a> method for the &quot;Planner&quot; <code>Policy</code> type.</p><h2 id="Examples"><a class="docs-heading-anchor" href="#Examples">Examples</a><a id="Examples-1"></a><a class="docs-heading-anchor-permalink" href="#Examples" title="Permalink"></a></h2><p>Solver implementation is most clearly explained through examples. 
The following sections contain examples of both online and offline solver definitions:</p><ul><li><a href="../offline_solver/#Example:-Defining-an-offline-solver">Example: Defining an offline solver</a></li><li><a href="../online_solver/#Example:-Defining-an-online-solver">Example: Defining an online solver</a></li></ul></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../interfaces/">« Spaces and Distributions</a><a class="docs-footer-nextpage" href="../offline_solver/">Example: Defining an offline solver »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Solvers · POMDPs.jl</title><meta name="title" content="Solvers · POMDPs.jl"/><meta property="og:title" content="Solvers · POMDPs.jl"/><meta property="twitter:title" content="Solvers · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li class="is-active"><a class="tocitem" href>Solvers</a><ul class="internal"><li><a class="tocitem" href="#Online-and-Offline-Solvers"><span>Online and Offline Solvers</span></a></li><li><a class="tocitem" href="#Examples"><span>Examples</span></a></li></ul></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" 
href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" 
href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Writing Solvers</a></li><li class="is-active"><a href>Solvers</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Solvers</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/def_solver.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Solvers"><a class="docs-heading-anchor" href="#Solvers">Solvers</a><a id="Solvers-1"></a><a class="docs-heading-anchor-permalink" href="#Solvers" title="Permalink"></a></h1><p>Defining a solver involves creating or using four pieces of code:</p><ol><li>A subtype of <a href="../api/#POMDPs.Solver"><code>Solver</code></a> that holds the parameters and configuration options for the solver.</li><li>A subtype of <a 
href="../api/#POMDPs.Policy"><code>Policy</code></a> that holds all of the data needed to choose actions online.</li><li>A method of <a href="../api/#POMDPs.solve"><code>solve</code></a> that takes the <code>Solver</code> and a (PO)MDP as arguments, performs all of the <em>offline</em> computations for solving the problem, and returns the policy.</li><li>A method of <a href="../api/#POMDPs.action"><code>action</code></a> that takes in the policy and a state or belief and returns an action.</li></ol><p>In many cases, items 2 and 4 can be satisfied with an off-the-shelf <code>Policy</code> from the <a href="../POMDPTools/#pomdptools_section">POMDPTools package</a>. POMDPTools also contains many tools that are useful for defining solvers in a robust, concise, and readable manner.</p><h2 id="Online-and-Offline-Solvers"><a class="docs-heading-anchor" href="#Online-and-Offline-Solvers">Online and Offline Solvers</a><a id="Online-and-Offline-Solvers-1"></a><a class="docs-heading-anchor-permalink" href="#Online-and-Offline-Solvers" title="Permalink"></a></h2><p>Generally, solvers can be grouped into two categories: <em>Offline</em> solvers that do most of their computational work <em>before</em> interacting with the environment, and <em>online</em> solvers that do their work online as each new state or observation is encountered. 
Although offline and online solvers both use the exact same <a href="../api/#POMDPs.Solver"><code>Solver</code></a>, <a href="../api/#POMDPs.solve"><code>solve</code></a>, <a href="../api/#POMDPs.Policy"><code>Policy</code></a>, <a href="../api/#POMDPs.action"><code>action</code></a> structure, the work of defining online and offline solvers is focused on different portions.</p><p>For an offline solver, most of the implementation effort will be spent on the <a href="../api/#POMDPs.solve"><code>solve</code></a> function, and an off-the-shelf policy from <a href="../POMDPTools/#pomdptools_section">POMDPTools</a> will typically be used.</p><p>For an online solver, the <a href="../api/#POMDPs.solve"><code>solve</code></a> function typically does little or no work, but merely creates a <code>Policy</code> object that will carry out computation online. It is typical in POMDPs.jl to use the term &quot;Planner&quot; to name a <a href="../api/#POMDPs.Policy"><code>Policy</code></a> object for an online solver that carries out a large amount of computation (&quot;planning&quot;) at interaction time. In this case most of the effort will be focused on implementing the <a href="../api/#POMDPs.action"><code>action</code></a> method for the &quot;Planner&quot; <code>Policy</code> type.</p><h2 id="Examples"><a class="docs-heading-anchor" href="#Examples">Examples</a><a id="Examples-1"></a><a class="docs-heading-anchor-permalink" href="#Examples" title="Permalink"></a></h2><p>Solver implementation is most clearly explained through examples. 
The following sections contain examples of both online and offline solver definitions:</p><ul><li><a href="../offline_solver/#Example:-Defining-an-offline-solver">Example: Defining an offline solver</a></li><li><a href="../online_solver/#Example:-Defining-an-online-solver">Example: Defining an online solver</a></li></ul></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../interfaces/">« Spaces and Distributions</a><a class="docs-footer-nextpage" href="../offline_solver/">Example: Defining an offline solver »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/def_updater/index.html b/dev/def_updater/index.html
index 200de762..0e4134f3 100644
--- a/dev/def_updater/index.html
+++ b/dev/def_updater/index.html
@@ -29,4 +29,4 @@
 b = Any[POMDPModels.BoolDistribution(0.0), false, false]
 b = Any[POMDPModels.BoolDistribution(0.0), false, false, false, false]
 b = Any[POMDPModels.BoolDistribution(0.0), false, false, false, false, true, false]
-b = Any[POMDPModels.BoolDistribution(0.0), false, false, false, false, true, false, true, false]</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../online_solver/">« Example: Defining an online solver</a><a class="docs-footer-nextpage" href="../simulation/">Simulation Standard »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+b = Any[POMDPModels.BoolDistribution(0.0), false, false, false, false, true, false, true, false]</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../online_solver/">« Example: Defining an online solver</a><a class="docs-footer-nextpage" href="../simulation/">Simulation Standard »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/example_defining_problems/index.html b/dev/example_defining_problems/index.html
index f71ee4f9..7e71aa2f 100644
--- a/dev/example_defining_problems/index.html
+++ b/dev/example_defining_problems/index.html
@@ -247,4 +247,4 @@
      
 discount = 0.9
 
-tabular_crying_baby_pomdp = TabularPOMDP(T, R, O, discount)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../examples/">« Examples</a><a class="docs-footer-nextpage" href="../example_solvers/">Using Different Solvers »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+tabular_crying_baby_pomdp = TabularPOMDP(T, R, O, discount)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../examples/">« Examples</a><a class="docs-footer-nextpage" href="../example_solvers/">Using Different Solvers »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/example_gridworld_mdp/index.html b/dev/example_gridworld_mdp/index.html
index ebdf36ba..16d2694b 100644
--- a/dev/example_gridworld_mdp/index.html
+++ b/dev/example_gridworld_mdp/index.html
@@ -48,10 +48,10 @@
 	Size x: 10
 	Size y: 10
 	Reward states:
-		Main.GridWorldState(8, 8) =&gt; 3.0
 		Main.GridWorldState(4, 3) =&gt; -10.0
-		Main.GridWorldState(4, 6) =&gt; -5.0
 		Main.GridWorldState(9, 3) =&gt; 10.0
+		Main.GridWorldState(4, 6) =&gt; -5.0
+		Main.GridWorldState(8, 8) =&gt; 3.0
 	Hit wall reward: -1.0
 	Transition probability: 0.7
 	Discount: 0.9
@@ -239,30 +239,30 @@
 solver = ValueIterationSolver(; max_iterations=100, belres=1e-3, verbose=true)
 
 # Solve for an optimal policy
-vi_policy = POMDPs.solve(solver, mdp)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">[Iteration 1   ] residual:         10 | iteration runtime:      0.227 ms, (  0.000227 s total)
-[Iteration 2   ] residual:        6.3 | iteration runtime:      0.232 ms, (  0.000459 s total)
-[Iteration 3   ] residual:       4.53 | iteration runtime:      0.214 ms, (  0.000673 s total)
-[Iteration 4   ] residual:       3.21 | iteration runtime:      0.211 ms, (  0.000885 s total)
-[Iteration 5   ] residual:       2.31 | iteration runtime:      0.213 ms, (    0.0011 s total)
-[Iteration 6   ] residual:       1.62 | iteration runtime:      0.212 ms, (   0.00131 s total)
-[Iteration 7   ] residual:       1.24 | iteration runtime:      0.211 ms, (   0.00152 s total)
-[Iteration 8   ] residual:       1.06 | iteration runtime:      0.206 ms, (   0.00173 s total)
-[Iteration 9   ] residual:      0.865 | iteration runtime:      0.209 ms, (   0.00194 s total)
-[Iteration 10  ] residual:      0.657 | iteration runtime:      0.206 ms, (   0.00214 s total)
-[Iteration 11  ] residual:      0.545 | iteration runtime:      0.217 ms, (   0.00236 s total)
-[Iteration 12  ] residual:      0.455 | iteration runtime:      0.209 ms, (   0.00257 s total)
-[Iteration 13  ] residual:      0.378 | iteration runtime:      0.208 ms, (   0.00278 s total)
-[Iteration 14  ] residual:      0.306 | iteration runtime:      0.208 ms, (   0.00298 s total)
-[Iteration 15  ] residual:      0.211 | iteration runtime:      0.209 ms, (   0.00319 s total)
-[Iteration 16  ] residual:      0.132 | iteration runtime:      0.210 ms, (    0.0034 s total)
-[Iteration 17  ] residual:     0.0778 | iteration runtime:      0.208 ms, (   0.00361 s total)
-[Iteration 18  ] residual:     0.0437 | iteration runtime:      0.209 ms, (   0.00382 s total)
-[Iteration 19  ] residual:     0.0237 | iteration runtime:      0.208 ms, (   0.00403 s total)
-[Iteration 20  ] residual:     0.0125 | iteration runtime:      0.233 ms, (   0.00426 s total)
-[Iteration 21  ] residual:    0.00649 | iteration runtime:      0.210 ms, (   0.00447 s total)
-[Iteration 22  ] residual:    0.00332 | iteration runtime:      0.208 ms, (   0.00468 s total)
-[Iteration 23  ] residual:    0.00167 | iteration runtime:      0.210 ms, (   0.00489 s total)
-[Iteration 24  ] residual:   0.000834 | iteration runtime:      0.210 ms, (    0.0051 s total)</code></pre><p>We can now use the policy to compute the optimal action for a given state:</p><pre><code class="language-julia hljs">s = GridWorldState(9, 2)
+vi_policy = POMDPs.solve(solver, mdp)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">[Iteration 1   ] residual:         10 | iteration runtime:      0.215 ms, (  0.000215 s total)
+[Iteration 2   ] residual:        6.3 | iteration runtime:      0.244 ms, (  0.000459 s total)
+[Iteration 3   ] residual:       4.53 | iteration runtime:      0.222 ms, (  0.000681 s total)
+[Iteration 4   ] residual:       3.21 | iteration runtime:      0.218 ms, (  0.000899 s total)
+[Iteration 5   ] residual:       2.31 | iteration runtime:      0.228 ms, (   0.00113 s total)
+[Iteration 6   ] residual:       1.62 | iteration runtime:      0.318 ms, (   0.00144 s total)
+[Iteration 7   ] residual:       1.24 | iteration runtime:      0.249 ms, (   0.00169 s total)
+[Iteration 8   ] residual:       1.06 | iteration runtime:      0.260 ms, (   0.00195 s total)
+[Iteration 9   ] residual:      0.865 | iteration runtime:      0.230 ms, (   0.00218 s total)
+[Iteration 10  ] residual:      0.657 | iteration runtime:      0.232 ms, (   0.00242 s total)
+[Iteration 11  ] residual:      0.545 | iteration runtime:      0.232 ms, (   0.00265 s total)
+[Iteration 12  ] residual:      0.455 | iteration runtime:      0.212 ms, (   0.00286 s total)
+[Iteration 13  ] residual:      0.378 | iteration runtime:      0.214 ms, (   0.00307 s total)
+[Iteration 14  ] residual:      0.306 | iteration runtime:      0.211 ms, (   0.00329 s total)
+[Iteration 15  ] residual:      0.211 | iteration runtime:      0.209 ms, (   0.00349 s total)
+[Iteration 16  ] residual:      0.132 | iteration runtime:      0.208 ms, (    0.0037 s total)
+[Iteration 17  ] residual:     0.0778 | iteration runtime:      0.212 ms, (   0.00391 s total)
+[Iteration 18  ] residual:     0.0437 | iteration runtime:      0.211 ms, (   0.00413 s total)
+[Iteration 19  ] residual:     0.0237 | iteration runtime:      0.209 ms, (   0.00433 s total)
+[Iteration 20  ] residual:     0.0125 | iteration runtime:      0.210 ms, (   0.00454 s total)
+[Iteration 21  ] residual:    0.00649 | iteration runtime:      0.212 ms, (   0.00476 s total)
+[Iteration 22  ] residual:    0.00332 | iteration runtime:      0.212 ms, (   0.00497 s total)
+[Iteration 23  ] residual:    0.00167 | iteration runtime:      0.215 ms, (   0.00518 s total)
+[Iteration 24  ] residual:   0.000834 | iteration runtime:      0.211 ms, (    0.0054 s total)</code></pre><p>We can now use the policy to compute the optimal action for a given state:</p><pre><code class="language-julia hljs">s = GridWorldState(9, 2)
 @show action(vi_policy, s)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">:up</code></pre><pre><code class="language-julia hljs">s = GridWorldState(8, 3)
 @show action(vi_policy, s)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">:right</code></pre><h2 id="Solving-the-Grid-World-MDP-(MCTS)"><a class="docs-heading-anchor" href="#Solving-the-Grid-World-MDP-(MCTS)">Solving the Grid World MDP (MCTS)</a><a id="Solving-the-Grid-World-MDP-(MCTS)-1"></a><a class="docs-heading-anchor-permalink" href="#Solving-the-Grid-World-MDP-(MCTS)" title="Permalink"></a></h2><p>Similar to the process with Value Iteration, we can solve the MDP using MCTS. We will use the <code>MCTSSolver</code> from the <a href="https://github.com/JuliaPOMDP/MCTS.jl">MCTS</a> package.</p><pre><code class="language-julia hljs"># Initialize the problem (we have already done this, but just calling it again for completeness in the example)
 mdp = GridWorldMDP()
@@ -367,4 +367,4 @@
  2 | →  →  →  →  →  →  →  →  ↑  ↑ |
  1 | →  →  →  →  →  →  ↑  ↑  ↑  ↑ |
    ------------------------------
-    1  2  3  4  5  6  7  8  9  10</code></pre><h2 id="Seeing-a-Policy-In-Action"><a class="docs-heading-anchor" href="#Seeing-a-Policy-In-Action">Seeing a Policy In Action</a><a id="Seeing-a-Policy-In-Action-1"></a><a class="docs-heading-anchor-permalink" href="#Seeing-a-Policy-In-Action" title="Permalink"></a></h2><p>Another useful tool is to view the policy in action by creating a gif of a simulation. To accomplish this, we could use <a href="https://github.com/JuliaPOMDP/POMDPGifs.jl">POMDPGifs</a>. To use POMDPGifs, we need to extend the <a href="../POMDPTools/visualization/#POMDPTools.ModelTools.render"><code>POMDPTools.render</code></a> function to <code>GridWorldMDP</code>. Please reference <a href="../gallery/#Gallery-of-POMDPs.jl-Problems">Gallery of POMDPs.jl Problems</a> for examples of this process.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../example_simulations/">« Simulations Examples</a><a class="docs-footer-nextpage" href="../gallery/">Gallery of POMDPs.jl Problems »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option 
value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+    1  2  3  4  5  6  7  8  9  10</code></pre><h2 id="Seeing-a-Policy-In-Action"><a class="docs-heading-anchor" href="#Seeing-a-Policy-In-Action">Seeing a Policy In Action</a><a id="Seeing-a-Policy-In-Action-1"></a><a class="docs-heading-anchor-permalink" href="#Seeing-a-Policy-In-Action" title="Permalink"></a></h2><p>Another useful tool is to view the policy in action by creating a gif of a simulation. To accomplish this, we could use <a href="https://github.com/JuliaPOMDP/POMDPGifs.jl">POMDPGifs</a>. To use POMDPGifs, we need to extend the <a href="../POMDPTools/visualization/#POMDPTools.ModelTools.render"><code>POMDPTools.render</code></a> function to <code>GridWorldMDP</code>. Please reference <a href="../gallery/#Gallery-of-POMDPs.jl-Problems">Gallery of POMDPs.jl Problems</a> for examples of this process.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../example_simulations/">« Simulations Examples</a><a class="docs-footer-nextpage" href="../gallery/">Gallery of POMDPs.jl Problems »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option 
value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/example_simulations/index.html b/dev/example_simulations/index.html
index 5f54059b..bc67cb19 100644
--- a/dev/example_simulations/index.html
+++ b/dev/example_simulations/index.html
@@ -24,21 +24,21 @@
 Step 2
 b = sated =&gt; 0.989010989010989, hungry =&gt; 0.010989010989010992
 s = :sated
-a = :feed
+a = :ignore
 o = :quiet
-r = -5.0
-r_sum = -5.5
+r = 0.0
+r_sum = -0.5
 
 Step 3
-b = sated =&gt; 1.0, hungry =&gt; 0.0
+b = sated =&gt; 0.9732977303070761, hungry =&gt; 0.026702269692923903
 s = :sated
-a = :ignore
-o = :quiet
-r = 0.0
+a = :feed
+o = :crying
+r = -5.0
 r_sum = -5.5
 
 Step 4
-b = sated =&gt; 0.9759036144578314, hungry =&gt; 0.024096385542168676
+b = sated =&gt; 1.0, hungry =&gt; 0.0
 s = :sated
 a = :sing
 o = :quiet
@@ -46,20 +46,20 @@
 r_sum = -6.0</code></pre><h2 id="Rollout-Simulations"><a class="docs-heading-anchor" href="#Rollout-Simulations">Rollout Simulations</a><a id="Rollout-Simulations-1"></a><a class="docs-heading-anchor-permalink" href="#Rollout-Simulations" title="Permalink"></a></h2><p>While stepthrough is a flexible and convenient tool for many user-facing demonstrations, it is often less error-prone to use the standard simulate function with a <code>Simulator</code> object. The simplest Simulator is the <code>RolloutSimulator</code>. It simply runs a simulation and returns the discounted reward. </p><pre><code class="language-julia hljs">policy = RandomPolicy(explicit_crying_baby_pomdp)
 sim = RolloutSimulator(max_steps=10)
 r_sum = simulate(sim, explicit_crying_baby_pomdp, policy)
-println(&quot;Total discounted reward: $r_sum&quot;)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">Total discounted reward: -45.4782422345</code></pre><h2 id="Recording-Histories"><a class="docs-heading-anchor" href="#Recording-Histories">Recording Histories</a><a id="Recording-Histories-1"></a><a class="docs-heading-anchor-permalink" href="#Recording-Histories" title="Permalink"></a></h2><p>Sometimes it is important to record the entire history of a simulation for further examination. This can be accomplished with a <code>HistoryRecorder</code>.</p><pre><code class="language-julia hljs">policy = RandomPolicy(tabular_crying_baby_pomdp)
+println(&quot;Total discounted reward: $r_sum&quot;)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">Total discounted reward: -49.81028715</code></pre><h2 id="Recording-Histories"><a class="docs-heading-anchor" href="#Recording-Histories">Recording Histories</a><a id="Recording-Histories-1"></a><a class="docs-heading-anchor-permalink" href="#Recording-Histories" title="Permalink"></a></h2><p>Sometimes it is important to record the entire history of a simulation for further examination. This can be accomplished with a <code>HistoryRecorder</code>.</p><pre><code class="language-julia hljs">policy = RandomPolicy(tabular_crying_baby_pomdp)
 hr = HistoryRecorder(max_steps=5)
-history = simulate(hr, tabular_crying_baby_pomdp, policy, DiscreteUpdater(tabular_crying_baby_pomdp), Deterministic(1))</code></pre><p>The history object produced by a <code>HistoryRecorder</code> is a <code>SimHistory</code>, documented in the POMDPTools simulater section <a href="../POMDPTools/simulators/#Histories">Histories</a>. The information in this object can be accessed in several ways. For example, there is a function:</p><pre><code class="language-julia hljs">discounted_reward(history)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">-14.543550000000002</code></pre><p>Accessor functions like <code>state_hist</code> and <code>action_hist</code> can also be used to access parts of the history:</p><pre><code class="language-julia hljs">state_hist(history)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">6-element Vector{Int64}:
+history = simulate(hr, tabular_crying_baby_pomdp, policy, DiscreteUpdater(tabular_crying_baby_pomdp), Deterministic(1))</code></pre><p>The history object produced by a <code>HistoryRecorder</code> is a <code>SimHistory</code>, documented in the POMDPTools simulator section <a href="../POMDPTools/simulators/#Histories">Histories</a>. The information in this object can be accessed in several ways. For example, there is a function:</p><pre><code class="language-julia hljs">discounted_reward(history)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">-9.05</code></pre><p>Accessor functions like <code>state_hist</code> and <code>action_hist</code> can also be used to access parts of the history:</p><pre><code class="language-julia hljs">state_hist(history)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">6-element Vector{Int64}:
  1
+ 1
+ 1
+ 1
+ 1
+ 1</code></pre><pre><code class="language-julia hljs">collect(action_hist(history))</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">5-element Vector{Int64}:
  2
+ 1
  2
  2
- 2
- 2</code></pre><pre><code class="language-julia hljs">collect(action_hist(history))</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">5-element Vector{Int64}:
- 3
- 3
- 3
- 2
- 2</code></pre><p>Keeping track of which states, actions, and observations belong together can be tricky (for example, since there is a starting state, and ending state, but no action is taken from the ending state, the list of actions has a different length than the list of states). It is often better to think of histories in terms of steps that include both starting and ending states.</p><p>The most powerful function for accessing the information in a <code>SimHistory</code> is the <code>eachstep</code> function which returns an iterator through named tuples representing each step in the history. The <code>eachstep</code> function is similar to the <code>stepthrough</code> function above except that it iterates through the immutable steps of a previously simulated history instead of conducting the simulation as the for loop is being carried out.</p><pre><code class="language-julia hljs">r_sum = 0.0
+ 1</code></pre><p>Keeping track of which states, actions, and observations belong together can be tricky (for example, since there is a starting state, and ending state, but no action is taken from the ending state, the list of actions has a different length than the list of states). It is often better to think of histories in terms of steps that include both starting and ending states.</p><p>The most powerful function for accessing the information in a <code>SimHistory</code> is the <code>eachstep</code> function which returns an iterator through named tuples representing each step in the history. The <code>eachstep</code> function is similar to the <code>stepthrough</code> function above except that it iterates through the immutable steps of a previously simulated history instead of conducting the simulation as the for loop is being carried out.</p><pre><code class="language-julia hljs">r_sum = 0.0
 step = 0
 for step_i in eachstep(sim_history, &quot;b,s,a,o,r&quot;)
     step += 1
@@ -76,42 +76,42 @@
 end # hide</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">Step 1
 step_i.b = sated =&gt; 1.0, hungry =&gt; 0.0
 step_i.s = 1
-step_i.a = 3
+step_i.a = 2
 step_i.o = 2
-step_i.r = 0.0
-r_sum = 0.0
+step_i.r = -0.5
+r_sum = -0.5
 
 Step 2
-step_i.b = sated =&gt; 0.9759036144578314, hungry =&gt; 0.024096385542168676
-step_i.s = 2
-step_i.a = 3
+step_i.b = sated =&gt; 0.989010989010989, hungry =&gt; 0.010989010989010992
+step_i.s = 1
+step_i.a = 1
 step_i.o = 2
-step_i.r = 0.0
-r_sum = 0.0
+step_i.r = -5.0
+r_sum = -5.5
 
 Step 3
-step_i.b = sated =&gt; 0.9701315984030756, hungry =&gt; 0.029868401596924443
-step_i.s = 2
-step_i.a = 3
-step_i.o = 1
-step_i.r = 0.0
-r_sum = 0.0
+step_i.b = sated =&gt; 1.0, hungry =&gt; 0.0
+step_i.s = 1
+step_i.a = 2
+step_i.o = 2
+step_i.r = -0.5
+r_sum = -6.0
 
 Step 4
-step_i.b = sated =&gt; 0.4624149353547852, hungry =&gt; 0.5375850646452149
-step_i.s = 2
+step_i.b = sated =&gt; 0.989010989010989, hungry =&gt; 0.010989010989010992
+step_i.s = 1
 step_i.a = 2
-step_i.o = 1
-step_i.r = -10.5
-r_sum = -10.5
+step_i.o = 2
+step_i.r = -0.5
+r_sum = -6.5
 
 Step 5
-step_i.b = sated =&gt; 0.0, hungry =&gt; 1.0
-step_i.s = 2
-step_i.a = 2
+step_i.b = sated =&gt; 0.9878048780487805, hungry =&gt; 0.012195121951219514
+step_i.s = 1
+step_i.a = 1
 step_i.o = 1
-step_i.r = -10.5
-r_sum = -21.0</code></pre><h2 id="Parallel-Simulations"><a class="docs-heading-anchor" href="#Parallel-Simulations">Parallel Simulations</a><a id="Parallel-Simulations-1"></a><a class="docs-heading-anchor-permalink" href="#Parallel-Simulations" title="Permalink"></a></h2><p>It is often useful to evaluate a policy by running many simulations. The parallel simulator is the most effective tool for this. To use the parallel simulator, first create a list of <code>Sim</code> objects, each of which contains all of the information needed to run a simulation. Then then run the simulations using <code>run_parallel</code>, which will return a <code>DataFrame</code> with the results.</p><p>In this example, we will compare the performance of the polcies we computed in the <a href="../example_solvers/#Using-Different-Solvers">Using Different Solvers</a> section (i.e. <code>sarsop_policy</code>, <code>pomcp_planner</code>, and <code>heuristic_policy</code>). To evaluate the policies, we will run 100 simulations for each policy. We can do this by adding 100 <code>Sim</code> objects of each policy to the list.</p><pre><code class="language-julia hljs">using DataFrames
+step_i.r = -5.0
+r_sum = -11.5</code></pre><h2 id="Parallel-Simulations"><a class="docs-heading-anchor" href="#Parallel-Simulations">Parallel Simulations</a><a id="Parallel-Simulations-1"></a><a class="docs-heading-anchor-permalink" href="#Parallel-Simulations" title="Permalink"></a></h2><p>It is often useful to evaluate a policy by running many simulations. The parallel simulator is the most effective tool for this. To use the parallel simulator, first create a list of <code>Sim</code> objects, each of which contains all of the information needed to run a simulation. Then run the simulations using <code>run_parallel</code>, which will return a <code>DataFrame</code> with the results.</p><p>In this example, we will compare the performance of the policies we computed in the <a href="../example_solvers/#Using-Different-Solvers">Using Different Solvers</a> section (i.e. <code>sarsop_policy</code>, <code>pomcp_planner</code>, and <code>heuristic_policy</code>). To evaluate the policies, we will run 100 simulations for each policy. We can do this by adding 100 <code>Sim</code> objects of each policy to the list.</p><pre><code class="language-julia hljs">using DataFrames
 using StatsBase: std
 
 # Defining paramters for the simulations
@@ -178,4 +178,4 @@
 
 # Calculate the mean and confidence interval for each policy
 grouped_df = groupby(data, :policy)
-result = combine(grouped_df, :reward =&gt; mean_and_ci =&gt; AsTable)</code></pre><div><div style = "float: left;"><span>4×3 DataFrame</span></div><div style = "clear: both;"></div></div><div class = "data-frame" style = "overflow-x: scroll;"><table class = "data-frame" style = "margin-bottom: 6px;"><thead><tr class = "header"><th class = "rowNumber" style = "font-weight: bold; text-align: right;">Row</th><th style = "text-align: left;">policy</th><th style = "text-align: left;">mean</th><th style = "text-align: left;">ci</th></tr><tr class = "subheader headerLastRow"><th class = "rowNumber" style = "font-weight: bold; text-align: right;"></th><th title = "Union{Missing, String}" style = "text-align: left;">String?</th><th title = "Float64" style = "text-align: left;">Float64</th><th title = "Float64" style = "text-align: left;">Float64</th></tr></thead><tbody><tr><td class = "rowNumber" style = "font-weight: bold; text-align: right;">1</td><td style = "text-align: left;">sarsop</td><td style = "text-align: right;">-14.6264</td><td style = "text-align: right;">1.81814</td></tr><tr><td class = "rowNumber" style = "font-weight: bold; text-align: right;">2</td><td style = "text-align: left;">pomcp</td><td style = "text-align: right;">-18.6904</td><td style = "text-align: right;">1.57649</td></tr><tr><td class = "rowNumber" style = "font-weight: bold; text-align: right;">3</td><td style = "text-align: left;">heuristic</td><td style = "text-align: right;">-15.4895</td><td style = "text-align: right;">1.96535</td></tr><tr><td class = "rowNumber" style = "font-weight: bold; text-align: right;">4</td><td style = "text-align: left;">random</td><td style = "text-align: right;">-30.4201</td><td style = "text-align: right;">2.64208</td></tr></tbody></table></div><p>By default, the parallel simulator only returns the reward from each simulation, but more information can be gathered by specifying a function to analyze the <code>Sim</code>-history pair and record additional 
statistics. Reference the POMDPTools simulator section for more information (<a href="../POMDPTools/simulators/#Specifying-information-to-be-recorded">Specifying information to be recorded</a>).</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../example_solvers/">« Using Different Solvers</a><a class="docs-footer-nextpage" href="../example_gridworld_mdp/">GridWorld MDP Tutorial »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+result = combine(grouped_df, :reward =&gt; mean_and_ci =&gt; AsTable)</code></pre><div><div style = "float: left;"><span>4×3 DataFrame</span></div><div style = "clear: both;"></div></div><div class = "data-frame" style = "overflow-x: scroll;"><table class = "data-frame" style = "margin-bottom: 6px;"><thead><tr class = "header"><th class = "rowNumber" style = "font-weight: bold; text-align: right;">Row</th><th style = "text-align: left;">policy</th><th style = "text-align: left;">mean</th><th style = "text-align: left;">ci</th></tr><tr class = "subheader headerLastRow"><th class = "rowNumber" style = "font-weight: bold; text-align: right;"></th><th title = "Union{Missing, String}" style = "text-align: left;">String?</th><th title = "Float64" style = "text-align: left;">Float64</th><th title = "Float64" style = "text-align: left;">Float64</th></tr></thead><tbody><tr><td class = "rowNumber" style = "font-weight: bold; text-align: right;">1</td><td style = "text-align: left;">sarsop</td><td style = "text-align: right;">-14.6264</td><td style = "text-align: right;">1.81814</td></tr><tr><td class = "rowNumber" style = "font-weight: bold; text-align: right;">2</td><td style = "text-align: left;">pomcp</td><td style = "text-align: right;">-18.6904</td><td style = "text-align: right;">1.57649</td></tr><tr><td class = "rowNumber" style = "font-weight: bold; text-align: right;">3</td><td style = "text-align: left;">heuristic</td><td style = "text-align: right;">-15.4871</td><td style = "text-align: right;">1.73522</td></tr><tr><td class = "rowNumber" style = "font-weight: bold; text-align: right;">4</td><td style = "text-align: left;">random</td><td style = "text-align: right;">-30.4201</td><td style = "text-align: right;">2.64208</td></tr></tbody></table></div><p>By default, the parallel simulator only returns the reward from each simulation, but more information can be gathered by specifying a function to analyze the <code>Sim</code>-history pair and record additional 
statistics. Reference the POMDPTools simulator section for more information (<a href="../POMDPTools/simulators/#Specifying-information-to-be-recorded">Specifying information to be recorded</a>).</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../example_solvers/">« Using Different Solvers</a><a class="docs-footer-nextpage" href="../example_gridworld_mdp/">GridWorld MDP Tutorial »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/example_solvers/index.html b/dev/example_solvers/index.html
index 7c33f48a..e94e2b26 100644
--- a/dev/example_solvers/index.html
+++ b/dev/example_solvers/index.html
@@ -25,19 +25,19 @@
 For solve(::QMDP.QMDPSolver, ::POMDP):
   [No additional requirements]
 For solve(::ValueIterationSolver, ::Union{MDP,POMDP}) (in solve(::QMDP.QMDPSolver, ::POMDP)):
-  [✔] discount(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;6ed96d00-fb5b-4b0b-95b8-068772e977d7&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol})
-  [✔] transition(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;6ed96d00-fb5b-4b0b-95b8-068772e977d7&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol}, ::Symbol, ::Symbol)
-  [✔] reward(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;6ed96d00-fb5b-4b0b-95b8-068772e977d7&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol}, ::Symbol, ::Symbol, ::Symbol)
-  [✔] stateindex(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;6ed96d00-fb5b-4b0b-95b8-068772e977d7&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol}, ::Symbol)
-  [✔] actionindex(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;6ed96d00-fb5b-4b0b-95b8-068772e977d7&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol}, ::Symbol)
-  [✔] actions(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;6ed96d00-fb5b-4b0b-95b8-068772e977d7&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol}, ::Symbol)
+  [✔] discount(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;bc06d3ef-e7bc-4206-81ed-395883874f86&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol})
+  [✔] transition(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;bc06d3ef-e7bc-4206-81ed-395883874f86&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol}, ::Symbol, ::Symbol)
+  [✔] reward(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;bc06d3ef-e7bc-4206-81ed-395883874f86&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol}, ::Symbol, ::Symbol, ::Symbol)
+  [✔] stateindex(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;bc06d3ef-e7bc-4206-81ed-395883874f86&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol}, ::Symbol)
+  [✔] actionindex(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;bc06d3ef-e7bc-4206-81ed-395883874f86&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol}, ::Symbol)
+  [✔] actions(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;bc06d3ef-e7bc-4206-81ed-395883874f86&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol}, ::Symbol)
   [✔] length(::Array{Symbol1})
   [✔] support(::Deterministic{Symbol})
   [✔] pdf(::Deterministic{Symbol}, ::Symbol)
 For ordered_states(::Union{MDP,POMDP}) (in solve(::ValueIterationSolver, ::Union{MDP,POMDP})):
-  [✔] states(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;6ed96d00-fb5b-4b0b-95b8-068772e977d7&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol})
+  [✔] states(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;bc06d3ef-e7bc-4206-81ed-395883874f86&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol})
 For ordered_actions(::Union{MDP,POMDP}) (in solve(::ValueIterationSolver, ::Union{MDP,POMDP})):
-  [✔] actions(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;6ed96d00-fb5b-4b0b-95b8-068772e977d7&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol})
+  [✔] actions(::UnderlyingMDP{QuickPOMDPs.QuickPOMDP{UUID(&quot;bc06d3ef-e7bc-4206-81ed-395883874f86&quot;), Symbol, Symbol, Symbol, @NamedTuple{stateindex::Dict{Symbol, Int64}, isterminal::Bool, obsindex::Dict{Symbol, Int64}, states::Vector{Symbol}, observations::Vector{Symbol}, discount::Float64, actions::Vector{Symbol}, observation::Main.var&quot;#2#5&quot;, actionindex::Dict{Symbol, Int64}, initialstate::Deterministic{Symbol}, transition::Main.var&quot;#1#4&quot;, reward::Main.var&quot;#3#6&quot;}}SymbolSymbol})
 
 Explicit Crying Baby POMDP
 INFO: POMDPLinter requirements for solve(::QMDP.QMDPSolver, ::POMDP) and dependencies. ([✔] = implemented correctly; [X] = not implemented; [?] = could not determine)
@@ -152,4 +152,4 @@
 
 @show [a1, a2]</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">2-element Vector{Symbol}:
  :feed
- :sing</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../example_defining_problems/">« Defining a POMDP</a><a class="docs-footer-nextpage" href="../example_simulations/">Simulations Examples »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+ :ignore</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../example_defining_problems/">« Defining a POMDP</a><a class="docs-footer-nextpage" href="../example_simulations/">Simulations Examples »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/examples/index.html b/dev/examples/index.html
index c1e9c3cb..70a43e4b 100644
--- a/dev/examples/index.html
+++ b/dev/examples/index.html
@@ -1,2 +1,2 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Examples · POMDPs.jl</title><meta name="title" content="Examples · POMDPs.jl"/><meta property="og:title" content="Examples · POMDPs.jl"/><meta property="twitter:title" content="Examples · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../def_updater/">Defining a Belief 
Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li class="is-active"><a class="tocitem" href>Examples</a><ul class="internal"><li><a class="tocitem" href="#Outline"><span>Outline</span></a></li></ul></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div 
class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Examples and Gallery</a></li><li class="is-active"><a href>Examples</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Examples</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/examples.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="examples_section"><a class="docs-heading-anchor" href="#examples_section">Examples</a><a id="examples_section-1"></a><a class="docs-heading-anchor-permalink" href="#examples_section" title="Permalink"></a></h1><p>This section contains examples of how to use POMDPs.jl. For specific informaiton about the interface and functions used in the examples, please reference the correpsonding area in the documenation or the <a href="../api/#API-Documentation">API Documentation</a>.</p><p>The examples are organized by topic. 
The exmaples are designed to build through each step. First, we have to define a POMDP. Then we need to solve the POMDP to get a policy. Finally, we can simulate the policy to see how it performs. The examples are designed to be exeucted in order. For example, the examples in <a href="../example_simulations/#Simulations-Examples">Simulations Examples</a> assume that the POMDPs defined in the <a href="../example_defining_problems/#Defining-a-POMDP">Defining a POMDP</a> section have been defined and we have a policy we would like to simulate that we computed in the <a href="../example_solvers/#Using-Different-Solvers">Using Different Solvers</a> section.</p><p>The <a href="../example_gridworld_mdp/#GridWorld-MDP-Tutorial">GridWorld MDP Tutorial</a> section is a standalone example that does not require any of the other examples.</p><h2 id="Outline"><a class="docs-heading-anchor" href="#Outline">Outline</a><a id="Outline-1"></a><a class="docs-heading-anchor-permalink" href="#Outline" title="Permalink"></a></h2><ul><li><a href="../example_defining_problems/#Defining-a-POMDP">Defining a POMDP</a></li><li class="no-marker"><ul><li><a href="../example_defining_problems/#CryingBaby-Problem-Definition">CryingBaby Problem Definition</a></li><li><a href="../example_defining_problems/#quick_crying">QuickPOMDP Interface</a></li><li><a href="../example_defining_problems/#explicit_crying">Explicit Interface</a></li><li><a href="../example_defining_problems/#gen_crying">Generative Interface</a></li><li><a href="../example_defining_problems/#tab_crying">Probability Tables</a></li></ul></li><li><a href="../example_solvers/#Using-Different-Solvers">Using Different Solvers</a></li><li class="no-marker"><ul><li><a href="../example_solvers/#Checking-Requirements">Checking Requirements</a></li><li><a href="../example_solvers/#Offline-(SARSOP)">Offline (SARSOP)</a></li><li><a href="../example_solvers/#Online-(POMCP)">Online (POMCP)</a></li><li><a 
href="../example_solvers/#Heuristic-Policy">Heuristic Policy</a></li></ul></li><li><a href="../example_simulations/#Simulations-Examples">Simulations Examples</a></li><li class="no-marker"><ul><li><a href="../example_simulations/#Stepthrough">Stepthrough</a></li><li><a href="../example_simulations/#Rollout-Simulations">Rollout Simulations</a></li><li><a href="../example_simulations/#Recording-Histories">Recording Histories</a></li><li><a href="../example_simulations/#Parallel-Simulations">Parallel Simulations</a></li></ul></li><li><a href="../example_gridworld_mdp/#GridWorld-MDP-Tutorial">GridWorld MDP Tutorial</a></li><li class="no-marker"><ul><li><a href="../example_gridworld_mdp/#Dependencies">Dependencies</a></li><li><a href="../example_gridworld_mdp/#Problem-Overview">Problem Overview</a></li><li><a href="../example_gridworld_mdp/#Defining-the-Grid-World-MDP-Type">Defining the Grid World MDP Type</a></li><li><a href="../example_gridworld_mdp/#Grid-World-State-Space">Grid World State Space</a></li><li><a href="../example_gridworld_mdp/#Grid-World-Action-Space">Grid World Action Space</a></li><li><a href="../example_gridworld_mdp/#Grid-World-Transition-Function">Grid World Transition Function</a></li><li><a href="../example_gridworld_mdp/#Grid-World-Reward-Function">Grid World Reward Function</a></li><li><a href="../example_gridworld_mdp/#Grid-World-Remaining-Functions">Grid World Remaining Functions</a></li><li><a href="../example_gridworld_mdp/#Solving-the-Grid-World-MDP-(Value-Iteration)">Solving the Grid World MDP (Value Iteration)</a></li><li><a href="../example_gridworld_mdp/#Solving-the-Grid-World-MDP-(MCTS)">Solving the Grid World MDP (MCTS)</a></li><li><a href="../example_gridworld_mdp/#Visualizing-the-Value-Iteration-Policy">Visualizing the Value Iteration Policy</a></li><li><a href="../example_gridworld_mdp/#Seeing-a-Policy-In-Action">Seeing a Policy In Action</a></li></ul></li></ul></article><nav class="docs-footer"><a class="docs-footer-prevpage" 
href="../policy_interaction/">« Interacting with Policies</a><a class="docs-footer-nextpage" href="../example_defining_problems/">Defining a POMDP »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Examples · POMDPs.jl</title><meta name="title" content="Examples · POMDPs.jl"/><meta property="og:title" content="Examples · POMDPs.jl"/><meta property="twitter:title" content="Examples · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../def_updater/">Defining a Belief 
Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li class="is-active"><a class="tocitem" href>Examples</a><ul class="internal"><li><a class="tocitem" href="#Outline"><span>Outline</span></a></li></ul></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div 
class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Examples and Gallery</a></li><li class="is-active"><a href>Examples</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Examples</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/examples.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="examples_section"><a class="docs-heading-anchor" href="#examples_section">Examples</a><a id="examples_section-1"></a><a class="docs-heading-anchor-permalink" href="#examples_section" title="Permalink"></a></h1><p>This section contains examples of how to use POMDPs.jl. For specific informaiton about the interface and functions used in the examples, please reference the correpsonding area in the documenation or the <a href="../api/#API-Documentation">API Documentation</a>.</p><p>The examples are organized by topic. 
The exmaples are designed to build through each step. First, we have to define a POMDP. Then we need to solve the POMDP to get a policy. Finally, we can simulate the policy to see how it performs. The examples are designed to be exeucted in order. For example, the examples in <a href="../example_simulations/#Simulations-Examples">Simulations Examples</a> assume that the POMDPs defined in the <a href="../example_defining_problems/#Defining-a-POMDP">Defining a POMDP</a> section have been defined and we have a policy we would like to simulate that we computed in the <a href="../example_solvers/#Using-Different-Solvers">Using Different Solvers</a> section.</p><p>The <a href="../example_gridworld_mdp/#GridWorld-MDP-Tutorial">GridWorld MDP Tutorial</a> section is a standalone example that does not require any of the other examples.</p><h2 id="Outline"><a class="docs-heading-anchor" href="#Outline">Outline</a><a id="Outline-1"></a><a class="docs-heading-anchor-permalink" href="#Outline" title="Permalink"></a></h2><ul><li><a href="../example_defining_problems/#Defining-a-POMDP">Defining a POMDP</a></li><li class="no-marker"><ul><li><a href="../example_defining_problems/#CryingBaby-Problem-Definition">CryingBaby Problem Definition</a></li><li><a href="../example_defining_problems/#quick_crying">QuickPOMDP Interface</a></li><li><a href="../example_defining_problems/#explicit_crying">Explicit Interface</a></li><li><a href="../example_defining_problems/#gen_crying">Generative Interface</a></li><li><a href="../example_defining_problems/#tab_crying">Probability Tables</a></li></ul></li><li><a href="../example_solvers/#Using-Different-Solvers">Using Different Solvers</a></li><li class="no-marker"><ul><li><a href="../example_solvers/#Checking-Requirements">Checking Requirements</a></li><li><a href="../example_solvers/#Offline-(SARSOP)">Offline (SARSOP)</a></li><li><a href="../example_solvers/#Online-(POMCP)">Online (POMCP)</a></li><li><a 
href="../example_solvers/#Heuristic-Policy">Heuristic Policy</a></li></ul></li><li><a href="../example_simulations/#Simulations-Examples">Simulations Examples</a></li><li class="no-marker"><ul><li><a href="../example_simulations/#Stepthrough">Stepthrough</a></li><li><a href="../example_simulations/#Rollout-Simulations">Rollout Simulations</a></li><li><a href="../example_simulations/#Recording-Histories">Recording Histories</a></li><li><a href="../example_simulations/#Parallel-Simulations">Parallel Simulations</a></li></ul></li><li><a href="../example_gridworld_mdp/#GridWorld-MDP-Tutorial">GridWorld MDP Tutorial</a></li><li class="no-marker"><ul><li><a href="../example_gridworld_mdp/#Dependencies">Dependencies</a></li><li><a href="../example_gridworld_mdp/#Problem-Overview">Problem Overview</a></li><li><a href="../example_gridworld_mdp/#Defining-the-Grid-World-MDP-Type">Defining the Grid World MDP Type</a></li><li><a href="../example_gridworld_mdp/#Grid-World-State-Space">Grid World State Space</a></li><li><a href="../example_gridworld_mdp/#Grid-World-Action-Space">Grid World Action Space</a></li><li><a href="../example_gridworld_mdp/#Grid-World-Transition-Function">Grid World Transition Function</a></li><li><a href="../example_gridworld_mdp/#Grid-World-Reward-Function">Grid World Reward Function</a></li><li><a href="../example_gridworld_mdp/#Grid-World-Remaining-Functions">Grid World Remaining Functions</a></li><li><a href="../example_gridworld_mdp/#Solving-the-Grid-World-MDP-(Value-Iteration)">Solving the Grid World MDP (Value Iteration)</a></li><li><a href="../example_gridworld_mdp/#Solving-the-Grid-World-MDP-(MCTS)">Solving the Grid World MDP (MCTS)</a></li><li><a href="../example_gridworld_mdp/#Visualizing-the-Value-Iteration-Policy">Visualizing the Value Iteration Policy</a></li><li><a href="../example_gridworld_mdp/#Seeing-a-Policy-In-Action">Seeing a Policy In Action</a></li></ul></li></ul></article><nav class="docs-footer"><a class="docs-footer-prevpage" 
href="../policy_interaction/">« Interacting with Policies</a><a class="docs-footer-nextpage" href="../example_defining_problems/">Defining a POMDP »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/faq/index.html b/dev/faq/index.html
index 1801a46b..3b710a0e 100644
--- a/dev/faq/index.html
+++ b/dev/faq/index.html
@@ -14,4 +14,4 @@
   end
 end
 
-POMDPs.reward(m, s, a) = rdict[(s, a)]</code></pre><h2 id="Why-do-I-need-to-put-type-assertions-pomdp::POMDP-into-the-function-signature?"><a class="docs-heading-anchor" href="#Why-do-I-need-to-put-type-assertions-pomdp::POMDP-into-the-function-signature?">Why do I need to put type assertions pomdp::POMDP into the function signature?</a><a id="Why-do-I-need-to-put-type-assertions-pomdp::POMDP-into-the-function-signature?-1"></a><a class="docs-heading-anchor-permalink" href="#Why-do-I-need-to-put-type-assertions-pomdp::POMDP-into-the-function-signature?" title="Permalink"></a></h2><p>Specifying the type in your function signature allows Julia to call the appropriate function when your custom type is passed into it. For example if a POMDPs.jl solver calls <code>states</code> on the POMDP that you passed into it, the correct <code>states</code> function will only get dispatched if you specified that the <code>states</code> function you wrote works with your POMDP type. Because Julia supports multiple-dispatch, these type assertion are a way for doing object-oriented programming in Julia.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../POMDPTools/testing/">« Testing</a><a class="docs-footer-nextpage" href="../api/">API Documentation »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option 
value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+POMDPs.reward(m, s, a) = rdict[(s, a)]</code></pre><h2 id="Why-do-I-need-to-put-type-assertions-pomdp::POMDP-into-the-function-signature?"><a class="docs-heading-anchor" href="#Why-do-I-need-to-put-type-assertions-pomdp::POMDP-into-the-function-signature?">Why do I need to put type assertions pomdp::POMDP into the function signature?</a><a id="Why-do-I-need-to-put-type-assertions-pomdp::POMDP-into-the-function-signature?-1"></a><a class="docs-heading-anchor-permalink" href="#Why-do-I-need-to-put-type-assertions-pomdp::POMDP-into-the-function-signature?" title="Permalink"></a></h2><p>Specifying the type in your function signature allows Julia to call the appropriate function when your custom type is passed into it. For example if a POMDPs.jl solver calls <code>states</code> on the POMDP that you passed into it, the correct <code>states</code> function will only get dispatched if you specified that the <code>states</code> function you wrote works with your POMDP type. Because Julia supports multiple-dispatch, these type assertion are a way for doing object-oriented programming in Julia.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../POMDPTools/testing/">« Testing</a><a class="docs-footer-nextpage" href="../api/">API Documentation »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option 
value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/gallery/index.html b/dev/gallery/index.html
index 18152a7a..ba9d8c2d 100644
--- a/dev/gallery/index.html
+++ b/dev/gallery/index.html
@@ -187,4 +187,4 @@
 sim = GifSimulator(; filename=&quot;examples/TagPOMDP.gif&quot;, max_steps=50, rng=MersenneTwister(1), show_progress=false)
 saved_gif = simulate(sim, pomdp, policy)
 
-println(&quot;gif saved to: $(saved_gif.filename)&quot;)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">gif saved to: examples/TagPOMDP.gif</code></pre><h2 id="Adding-New-Gallery-Examples"><a class="docs-heading-anchor" href="#Adding-New-Gallery-Examples">Adding New Gallery Examples</a><a id="Adding-New-Gallery-Examples-1"></a><a class="docs-heading-anchor-permalink" href="#Adding-New-Gallery-Examples" title="Permalink"></a></h2><p>To add new examples, please submit a pull request to the POMDPs.jl repository with changes made to the <code>gallery.md</code> file in <code>docs/src/</code>. Please include the creation of a gif in the code snippet. The gif should be generated during the creation of the documenation using <code>@eval</code> and saved in the <code>docs/src/examples/</code> directory. The gif should be named <code>problem_name.gif</code> where <code>problem_name</code> is the name of the problem. The gif can then be included using <code>![problem_name](examples/problem_name.gif)</code>.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../example_gridworld_mdp/">« GridWorld MDP Tutorial</a><a class="docs-footer-nextpage" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option 
value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+println(&quot;gif saved to: $(saved_gif.filename)&quot;)</code></pre><pre class="documenter-example-output"><code class="nohighlight hljs ansi">gif saved to: examples/TagPOMDP.gif</code></pre><h2 id="Adding-New-Gallery-Examples"><a class="docs-heading-anchor" href="#Adding-New-Gallery-Examples">Adding New Gallery Examples</a><a id="Adding-New-Gallery-Examples-1"></a><a class="docs-heading-anchor-permalink" href="#Adding-New-Gallery-Examples" title="Permalink"></a></h2><p>To add new examples, please submit a pull request to the POMDPs.jl repository with changes made to the <code>gallery.md</code> file in <code>docs/src/</code>. Please include the creation of a gif in the code snippet. The gif should be generated during the creation of the documentation using <code>@eval</code> and saved in the <code>docs/src/examples/</code> directory. The gif should be named <code>problem_name.gif</code> where <code>problem_name</code> is the name of the problem. The gif can then be included using <code>![problem_name](examples/problem_name.gif)</code>.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../example_gridworld_mdp/">« GridWorld MDP Tutorial</a><a class="docs-footer-nextpage" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option 
value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/get_started/index.html b/dev/get_started/index.html
index e313c041..9ee119ae 100644
--- a/dev/get_started/index.html
+++ b/dev/get_started/index.html
@@ -13,4 +13,4 @@
 init_dist = initialstate(pomdp) # from POMDPModels
 hr = HistoryRecorder(max_steps=100) # from POMDPTools
 hist = simulate(hr, pomdp, policy, belief_updater, init_dist) # run 100 step simulation
-println(&quot;reward: $(discounted_reward(hist))&quot;)</code></pre><p>The first part of the code loads the desired packages and initializes the problem and the solver. Next, we compute a POMDP policy. Lastly, we evaluate the results.</p><p>There are a few things to mention here. First, the TigerPOMDP type implements all the functions required by QMDPSolver to compute a policy. Second, each policy has a default updater (essentially a filter used to update the belief of the POMDP). To learn more about Updaters check out the <a href="../concepts/#Concepts-and-Architecture">Concepts and Architecture</a> section.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../install/">« Installation</a><a class="docs-footer-nextpage" href="../concepts/">Concepts and Architecture »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 
July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+println(&quot;reward: $(discounted_reward(hist))&quot;)</code></pre><p>The first part of the code loads the desired packages and initializes the problem and the solver. Next, we compute a POMDP policy. Lastly, we evaluate the results.</p><p>There are a few things to mention here. First, the TigerPOMDP type implements all the functions required by QMDPSolver to compute a policy. Second, each policy has a default updater (essentially a filter used to update the belief of the POMDP). To learn more about Updaters check out the <a href="../concepts/#Concepts-and-Architecture">Concepts and Architecture</a> section.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../install/">« Installation</a><a class="docs-footer-nextpage" href="../concepts/">Concepts and Architecture »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 
July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/index.html b/dev/index.html
index 3d9263cb..4211d280 100644
--- a/dev/index.html
+++ b/dev/index.html
@@ -1,2 +1,2 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>POMDPs.jl · POMDPs.jl</title><meta name="title" content="POMDPs.jl · POMDPs.jl"/><meta property="og:title" content="POMDPs.jl · POMDPs.jl"/><meta property="twitter:title" content="POMDPs.jl · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="assets/documenter.js"></script><script src="search_index.js"></script><script src="siteinfo.js"></script><script src="../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href><img src="assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href>POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li class="is-active"><a class="tocitem" href>POMDPs.jl</a><ul class="internal"><li><a class="tocitem" href="#Package-and-Ecosystem-Features"><span>Package and Ecosystem Features</span></a></li><li><a class="tocitem" href="#Available-Packages"><span>Available Packages</span></a></li><li><a class="tocitem" href="#Documentation-Outline"><span>Documentation Outline</span></a></li></ul></li><li><a class="tocitem" href="install/">Installation</a></li><li><a class="tocitem" href="get_started/">Getting Started</a></li><li><a class="tocitem" href="concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="def_solver/">Solvers</a></li><li><a class="tocitem" 
href="offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="simulation/">Simulation Standard</a></li><li><a class="tocitem" href="run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="examples/">Examples</a></li><li><a class="tocitem" href="example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="faq/">Frequently Asked Questions 
(FAQ)</a></li><li><a class="tocitem" href="api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Basics</a></li><li class="is-active"><a href>POMDPs.jl</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>POMDPs.jl</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/index.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="[POMDPs.jl](https://github.com/JuliaPOMDP/POMDPs.jl)"><a class="docs-heading-anchor" href="#[POMDPs.jl](https://github.com/JuliaPOMDP/POMDPs.jl)"><a href="https://github.com/JuliaPOMDP/POMDPs.jl">POMDPs.jl</a></a><a id="[POMDPs.jl](https://github.com/JuliaPOMDP/POMDPs.jl)-1"></a><a class="docs-heading-anchor-permalink" href="#[POMDPs.jl](https://github.com/JuliaPOMDP/POMDPs.jl)" title="Permalink"></a></h1><p><em>A Julia 
interface for defining, solving and simulating partially observable Markov decision processes and their fully observable counterparts.</em></p><h2 id="Package-and-Ecosystem-Features"><a class="docs-heading-anchor" href="#Package-and-Ecosystem-Features">Package and Ecosystem Features</a><a id="Package-and-Ecosystem-Features-1"></a><a class="docs-heading-anchor-permalink" href="#Package-and-Ecosystem-Features" title="Permalink"></a></h2><ul><li>General interface that can handle problems with discrete and continuous state/action/observation spaces</li><li>A number of popular state-of-the-art solvers implemented for use out-of-the-box</li><li>Tools that make it easy to define problems and simulate solutions</li><li>Simple integration of custom solvers into the existing interface</li></ul><h2 id="Available-Packages"><a class="docs-heading-anchor" href="#Available-Packages">Available Packages</a><a id="Available-Packages-1"></a><a class="docs-heading-anchor-permalink" href="#Available-Packages" title="Permalink"></a></h2><p>The POMDPs.jl package contains only the interface used for expressing and solving Markov decision processes (MDPs) and partially observable Markov decision processes (POMDPs). The <a href="POMDPTools/#pomdptools_section">POMDPTools</a> package acts as a &quot;standard library&quot; for the POMDPs.jl interface, providing implementations of commonly-used components such as policies, belief updaters, distributions, and simulators. 
The list of solver and support packages maintained by the <a href="https://github.com/JuliaPOMDP">JuliaPOMDP</a> community is available at the <a href="https://github.com/JuliaPOMDP/POMDPs.jl#supported-packages">POMDPs.jl Readme</a>.</p><h2 id="Documentation-Outline"><a class="docs-heading-anchor" href="#Documentation-Outline">Documentation Outline</a><a id="Documentation-Outline-1"></a><a class="docs-heading-anchor-permalink" href="#Documentation-Outline" title="Permalink"></a></h2><p>Documentation comes in three forms:</p><ol><li>An explanatory guide is available in the sections outlined below.</li><li>How-to examples are available throughout this documentation with specicic examples in <a href="examples/#examples_section">Examples</a> and <a href="gallery/#Gallery-of-POMDPs.jl-Problems">Gallery of POMDPs.jl Problems</a>.</li><li>Reference docstrings for the entire POMDPs.jl interface are available in the <a href="api/#API-Documentation">API Documentation</a> section.</li></ol><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>When updating these documents, make sure this is synced with <a href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/make.jl">docs/make.jl</a>!!</p></div></div><h3 id="Basics"><a class="docs-heading-anchor" href="#Basics">Basics</a><a id="Basics-1"></a><a class="docs-heading-anchor-permalink" href="#Basics" title="Permalink"></a></h3><ul><li><a href="install/#Installation">Installation</a></li><li><a href="get_started/#Getting-Started">Getting Started</a></li><li><a href="concepts/#Concepts-and-Architecture">Concepts and Architecture</a></li><li class="no-marker"><ul><li><a href="concepts/#POMDPs-and-MDPs">POMDPs and MDPs</a></li><li><a href="concepts/#Beliefs-and-Updaters">Beliefs and Updaters</a></li><li><a href="concepts/#Solvers-and-Policies">Solvers and Policies</a></li><li><a href="concepts/#Simulators">Simulators</a></li></ul></li></ul><h3 
id="Defining-POMDP-Models"><a class="docs-heading-anchor" href="#Defining-POMDP-Models">Defining POMDP Models</a><a id="Defining-POMDP-Models-1"></a><a class="docs-heading-anchor-permalink" href="#Defining-POMDP-Models" title="Permalink"></a></h3><ul><li><a href="def_pomdp/#defining_pomdps">Defining POMDPs and MDPs</a></li><li class="no-marker"><ul><li><a href="def_pomdp/#tiger">A Basic Example: The Tiger POMDP</a></li><li><a href="def_pomdp/#Guide-to-Defining-POMDPs">Guide to Defining POMDPs</a></li><li class="no-marker"><ul><li><a href="def_pomdp/#po-mountaincar">A more complex example: A partially-observable mountain car</a></li><li><a href="def_pomdp/#space_representation">State, action, and observation spaces</a></li><li><a href="def_pomdp/#Transition-and-observation-distributions-2">Transition and observation distributions</a></li><li><a href="def_pomdp/#Reward-functions">Reward functions</a></li><li><a href="def_pomdp/#Other-Components">Other Components</a></li></ul></li><li><a href="def_pomdp/#Other-ways-to-define-a-(PO)MDP">Other ways to define a (PO)MDP</a></li><li class="no-marker"><ul><li><a href="def_pomdp/#Object-oriented">Object-oriented</a></li><li><a href="def_pomdp/#Using-a-single-generative-function-instead-of-separate-T,-Z,-and-R">Using a single generative function instead of separate <span>$T$</span>, <span>$Z$</span>, and <span>$R$</span></a></li><li><a href="def_pomdp/#Tabular">Tabular</a></li></ul></li></ul></li><li><a href="interfaces/#Spaces-and-Distributions">Spaces and Distributions</a></li><li class="no-marker"><ul><li><a href="interfaces/#space-interface">Spaces</a></li><li><a href="interfaces/#Distributions">Distributions</a></li></ul></li></ul><h3 id="Writing-Solvers-and-Updaters"><a class="docs-heading-anchor" href="#Writing-Solvers-and-Updaters">Writing Solvers and Updaters</a><a id="Writing-Solvers-and-Updaters-1"></a><a class="docs-heading-anchor-permalink" href="#Writing-Solvers-and-Updaters" 
title="Permalink"></a></h3><ul><li><a href="def_solver/#Solvers">Solvers</a></li><li class="no-marker"><ul><li><a href="def_solver/#Online-and-Offline-Solvers">Online and Offline Solvers</a></li><li><a href="def_solver/#Examples">Examples</a></li></ul></li><li><a href="offline_solver/#Example:-Defining-an-offline-solver">Example: Defining an offline solver</a></li><li><a href="online_solver/#Example:-Defining-an-online-solver">Example: Defining an online solver</a></li><li><a href="def_updater/#Defining-a-Belief-Updater">Defining a Belief Updater</a></li><li class="no-marker"><ul><li><a href="def_updater/#Defining-a-Belief-Type">Defining a Belief Type</a></li><li><a href="def_updater/#Defining-an-Updater">Defining an Updater</a></li></ul></li></ul><h3 id="Analyzing-Results"><a class="docs-heading-anchor" href="#Analyzing-Results">Analyzing Results</a><a id="Analyzing-Results-1"></a><a class="docs-heading-anchor-permalink" href="#Analyzing-Results" title="Permalink"></a></h3><ul><li><a href="simulation/#Simulation-Standard">Simulation Standard</a></li><li class="no-marker"><ul><li><a href="simulation/#POMDP-Simulation">POMDP Simulation</a></li><li><a href="simulation/#MDP-Simulation">MDP Simulation</a></li></ul></li><li><a href="run_simulation/#Running-Simulations">Running Simulations</a></li><li><a href="policy_interaction/#Interacting-with-Policies">Interacting with Policies</a></li></ul><h3 id="Examples-and-Gallery"><a class="docs-heading-anchor" href="#Examples-and-Gallery">Examples and Gallery</a><a id="Examples-and-Gallery-1"></a><a class="docs-heading-anchor-permalink" href="#Examples-and-Gallery" title="Permalink"></a></h3><ul><li><a href="examples/#examples_section">Examples</a></li><li class="no-marker"><ul><li><a href="examples/#Outline">Outline</a></li></ul></li><li><a href="example_defining_problems/#Defining-a-POMDP">Defining a POMDP</a></li><li class="no-marker"><ul><li><a href="example_defining_problems/#CryingBaby-Problem-Definition">CryingBaby 
Problem Definition</a></li><li><a href="example_defining_problems/#quick_crying">QuickPOMDP Interface</a></li><li><a href="example_defining_problems/#explicit_crying">Explicit Interface</a></li><li><a href="example_defining_problems/#gen_crying">Generative Interface</a></li><li><a href="example_defining_problems/#tab_crying">Probability Tables</a></li></ul></li><li><a href="example_solvers/#Using-Different-Solvers">Using Different Solvers</a></li><li class="no-marker"><ul><li><a href="example_solvers/#Checking-Requirements">Checking Requirements</a></li><li><a href="example_solvers/#Offline-(SARSOP)">Offline (SARSOP)</a></li><li><a href="example_solvers/#Online-(POMCP)">Online (POMCP)</a></li><li><a href="example_solvers/#Heuristic-Policy">Heuristic Policy</a></li></ul></li><li><a href="example_simulations/#Simulations-Examples">Simulations Examples</a></li><li class="no-marker"><ul><li><a href="example_simulations/#Stepthrough">Stepthrough</a></li><li><a href="example_simulations/#Rollout-Simulations">Rollout Simulations</a></li><li><a href="example_simulations/#Recording-Histories">Recording Histories</a></li><li><a href="example_simulations/#Parallel-Simulations">Parallel Simulations</a></li></ul></li><li><a href="example_gridworld_mdp/#GridWorld-MDP-Tutorial">GridWorld MDP Tutorial</a></li><li class="no-marker"><ul><li><a href="example_gridworld_mdp/#Dependencies">Dependencies</a></li><li><a href="example_gridworld_mdp/#Problem-Overview">Problem Overview</a></li><li><a href="example_gridworld_mdp/#Defining-the-Grid-World-MDP-Type">Defining the Grid World MDP Type</a></li><li><a href="example_gridworld_mdp/#Grid-World-State-Space">Grid World State Space</a></li><li><a href="example_gridworld_mdp/#Grid-World-Action-Space">Grid World Action Space</a></li><li><a href="example_gridworld_mdp/#Grid-World-Transition-Function">Grid World Transition Function</a></li><li><a href="example_gridworld_mdp/#Grid-World-Reward-Function">Grid World Reward Function</a></li><li><a 
href="example_gridworld_mdp/#Grid-World-Remaining-Functions">Grid World Remaining Functions</a></li><li><a href="example_gridworld_mdp/#Solving-the-Grid-World-MDP-(Value-Iteration)">Solving the Grid World MDP (Value Iteration)</a></li><li><a href="example_gridworld_mdp/#Solving-the-Grid-World-MDP-(MCTS)">Solving the Grid World MDP (MCTS)</a></li><li><a href="example_gridworld_mdp/#Visualizing-the-Value-Iteration-Policy">Visualizing the Value Iteration Policy</a></li><li><a href="example_gridworld_mdp/#Seeing-a-Policy-In-Action">Seeing a Policy In Action</a></li></ul></li><li><a href="gallery/#Gallery-of-POMDPs.jl-Problems">Gallery of POMDPs.jl Problems</a></li><li class="no-marker"><ul><li><a href="gallery/#[EscapeRoomba](https://github.com/sisl/AA228FinalProject)">EscapeRoomba</a></li><li><a href="gallery/#[DroneSurveillance](https://github.com/JuliaPOMDP/DroneSurveillance.jl)">DroneSurveillance</a></li><li><a href="gallery/#[QuickMountainCar](https://github.com/JuliaPOMDP/QuickPOMDPs.jl)">QuickMountainCar</a></li><li><a href="gallery/#[RockSample](https://github.com/JuliaPOMDP/RockSample.jl)">RockSample</a></li><li><a href="gallery/#[TagPOMDPProblem](https://github.com/JuliaPOMDP/TagPOMDPProblem.jl)">TagPOMDPProblem</a></li><li><a href="gallery/#Adding-New-Gallery-Examples">Adding New Gallery Examples</a></li></ul></li></ul><h3 id="POMDPTools-the-standard-library-for-POMDPs.jl"><a class="docs-heading-anchor" href="#POMDPTools-the-standard-library-for-POMDPs.jl">POMDPTools - the standard library for POMDPs.jl</a><a id="POMDPTools-the-standard-library-for-POMDPs.jl-1"></a><a class="docs-heading-anchor-permalink" href="#POMDPTools-the-standard-library-for-POMDPs.jl" title="Permalink"></a></h3><ul><li><a href="POMDPTools/#pomdptools_section">POMDPTools: the standard library for POMDPs.jl</a></li><li><a href="POMDPTools/distributions/#Implemented-Distributions">Implemented Distributions</a></li><li class="no-marker"><ul><li><a 
href="POMDPTools/distributions/#Sparse-Categorical-(SparseCat)">Sparse Categorical (<code>SparseCat</code>)</a></li><li><a href="POMDPTools/distributions/#Implicit">Implicit</a></li><li><a href="POMDPTools/distributions/#Bool-Distribution">Bool Distribution</a></li><li><a href="POMDPTools/distributions/#Deterministic">Deterministic</a></li><li><a href="POMDPTools/distributions/#Uniform">Uniform</a></li><li><a href="POMDPTools/distributions/#Pretty-Printing">Pretty Printing</a></li></ul></li><li><a href="POMDPTools/model/#Model-Tools">Model Tools</a></li><li class="no-marker"><ul><li><a href="POMDPTools/model/#Interface-Extensions">Interface Extensions</a></li><li><a href="POMDPTools/model/#Model-Transformations">Model Transformations</a></li><li><a href="POMDPTools/model/#Utility-Types">Utility Types</a></li></ul></li><li><a href="POMDPTools/visualization/#Visualization">Visualization</a></li><li><a href="POMDPTools/beliefs/#Implemented-Belief-Updaters">Implemented Belief Updaters</a></li><li class="no-marker"><ul><li><a href="POMDPTools/beliefs/#Discrete-(Bayesian-Filter)">Discrete (Bayesian Filter)</a></li><li><a href="POMDPTools/beliefs/#K-Previous-Observations">K Previous Observations</a></li><li><a href="POMDPTools/beliefs/#Previous-Observation">Previous Observation</a></li><li><a href="POMDPTools/beliefs/#Nothing-Updater">Nothing Updater</a></li></ul></li><li><a href="POMDPTools/policies/#Implemented-Policies">Implemented Policies</a></li><li class="no-marker"><ul><li><a href="POMDPTools/policies/#Function">Function</a></li><li><a href="POMDPTools/policies/#Alpha-Vector-Policy">Alpha Vector Policy</a></li><li><a href="POMDPTools/policies/#Random-Policy">Random Policy</a></li><li><a href="POMDPTools/policies/#Stochastic-Policies">Stochastic Policies</a></li><li><a href="POMDPTools/policies/#Vector-Policies">Vector Policies</a></li><li><a href="POMDPTools/policies/#Value-Dict-Policy">Value Dict Policy</a></li><li><a 
href="POMDPTools/policies/#Exploration-Policies">Exploration Policies</a></li><li><a href="POMDPTools/policies/#Playback-Policy">Playback Policy</a></li><li><a href="POMDPTools/policies/#Utility-Wrapper">Utility Wrapper</a></li><li><a href="POMDPTools/policies/#Pretty-Printing-Policies">Pretty Printing Policies</a></li></ul></li><li><a href="POMDPTools/policies/#Policy-Evaluation">Policy Evaluation</a></li><li><a href="POMDPTools/simulators/#Implemented-Simulators">Implemented Simulators</a></li><li class="no-marker"><ul><li><a href="POMDPTools/simulators/#which_simulator">Which Simulator Should I Use?</a></li><li><a href="POMDPTools/simulators/#Stepping-through">Stepping through</a></li><li><a href="POMDPTools/simulators/#Rollouts">Rollouts</a></li><li><a href="POMDPTools/simulators/#History-Recorder">History Recorder</a></li><li><a href="POMDPTools/simulators/#sim-function"><code>sim()</code></a></li><li><a href="POMDPTools/simulators/#Histories">Histories</a></li><li><a href="POMDPTools/simulators/#Parallel">Parallel</a></li><li><a href="POMDPTools/simulators/#Display">Display</a></li></ul></li><li><a href="POMDPTools/common_rl/#CommonRLInterface-Integration">CommonRLInterface Integration</a></li><li class="no-marker"><ul><li><a href="POMDPTools/common_rl/#Environment-Wrapper-Types">Environment Wrapper Types</a></li><li><a href="POMDPTools/common_rl/#Constructors">Constructors</a></li></ul></li><li><a href="POMDPTools/testing/#Testing">Testing</a></li><li class="no-marker"><ul><li><a href="POMDPTools/testing/#Testing-(PO)MDP-Models">Testing (PO)MDP Models</a></li><li><a href="POMDPTools/testing/#Testing-Solvers">Testing Solvers</a></li></ul></li></ul><h3 id="Reference"><a class="docs-heading-anchor" href="#Reference">Reference</a><a id="Reference-1"></a><a class="docs-heading-anchor-permalink" href="#Reference" title="Permalink"></a></h3><ul><li><a href="faq/#Frequently-Asked-Questions-(FAQ)">Frequently Asked Questions (FAQ)</a></li><li 
class="no-marker"><ul><li><a href="faq/#What-is-the-difference-between-transition,-gen,-and-@gen?">What is the difference between <code>transition</code>, <code>gen</code>, and <code>@gen</code>?</a></li><li><a href="faq/#How-do-I-save-my-policies?">How do I save my policies?</a></li><li><a href="faq/#Why-is-my-solver-producing-a-suboptimal-policy?">Why is my solver producing a suboptimal policy?</a></li><li><a href="faq/#What-if-I-don&#39;t-use-the-rng-argument?">What if I don&#39;t use the <code>rng</code> argument?</a></li><li><a href="faq/#Why-are-all-the-solvers-in-separate-modules?">Why are all the solvers in separate modules?</a></li><li><a href="faq/#How-can-I-implement-terminal-actions?">How can I implement terminal actions?</a></li><li><a href="faq/#Why-are-there-two-versions-of-reward?">Why are there two versions of <code>reward</code>?</a></li><li><a href="faq/#How-do-I-implement-reward(m,-s,-a)-if-the-reward-depends-on-the-next-state?">How do I implement <code>reward(m, s, a)</code> if the reward depends on the next state?</a></li><li><a href="faq/#Why-do-I-need-to-put-type-assertions-pomdp::POMDP-into-the-function-signature?">Why do I need to put type assertions pomdp::POMDP into the function signature?</a></li></ul></li><li><a href="api/#API-Documentation">API Documentation</a></li><li class="no-marker"><ul><li><a href="api/#Contents">Contents</a></li><li><a href="api/#Index">Index</a></li><li><a href="api/#Types">Types</a></li><li><a href="api/#Model-Functions">Model Functions</a></li><li><a href="api/#Belief-Functions">Belief Functions</a></li><li><a href="api/#Policy-and-Solver-Functions">Policy and Solver Functions</a></li><li><a href="api/#Simulator">Simulator</a></li></ul></li></ul></article><nav class="docs-footer"><a class="docs-footer-nextpage" href="install/">Installation »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a 
href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>POMDPs.jl · POMDPs.jl</title><meta name="title" content="POMDPs.jl · POMDPs.jl"/><meta property="og:title" content="POMDPs.jl · POMDPs.jl"/><meta property="twitter:title" content="POMDPs.jl · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="assets/documenter.js"></script><script src="search_index.js"></script><script src="siteinfo.js"></script><script src="../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href><img src="assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href>POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li class="is-active"><a class="tocitem" href>POMDPs.jl</a><ul class="internal"><li><a class="tocitem" href="#Package-and-Ecosystem-Features"><span>Package and Ecosystem Features</span></a></li><li><a class="tocitem" href="#Available-Packages"><span>Available Packages</span></a></li><li><a class="tocitem" href="#Documentation-Outline"><span>Documentation Outline</span></a></li></ul></li><li><a class="tocitem" href="install/">Installation</a></li><li><a class="tocitem" href="get_started/">Getting Started</a></li><li><a class="tocitem" href="concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="def_solver/">Solvers</a></li><li><a class="tocitem" 
href="offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="simulation/">Simulation Standard</a></li><li><a class="tocitem" href="run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="examples/">Examples</a></li><li><a class="tocitem" href="example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="faq/">Frequently Asked Questions 
(FAQ)</a></li><li><a class="tocitem" href="api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Basics</a></li><li class="is-active"><a href>POMDPs.jl</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>POMDPs.jl</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/index.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="[POMDPs.jl](https://github.com/JuliaPOMDP/POMDPs.jl)"><a class="docs-heading-anchor" href="#[POMDPs.jl](https://github.com/JuliaPOMDP/POMDPs.jl)"><a href="https://github.com/JuliaPOMDP/POMDPs.jl">POMDPs.jl</a></a><a id="[POMDPs.jl](https://github.com/JuliaPOMDP/POMDPs.jl)-1"></a><a class="docs-heading-anchor-permalink" href="#[POMDPs.jl](https://github.com/JuliaPOMDP/POMDPs.jl)" title="Permalink"></a></h1><p><em>A Julia 
interface for defining, solving and simulating partially observable Markov decision processes and their fully observable counterparts.</em></p><h2 id="Package-and-Ecosystem-Features"><a class="docs-heading-anchor" href="#Package-and-Ecosystem-Features">Package and Ecosystem Features</a><a id="Package-and-Ecosystem-Features-1"></a><a class="docs-heading-anchor-permalink" href="#Package-and-Ecosystem-Features" title="Permalink"></a></h2><ul><li>General interface that can handle problems with discrete and continuous state/action/observation spaces</li><li>A number of popular state-of-the-art solvers implemented for use out-of-the-box</li><li>Tools that make it easy to define problems and simulate solutions</li><li>Simple integration of custom solvers into the existing interface</li></ul><h2 id="Available-Packages"><a class="docs-heading-anchor" href="#Available-Packages">Available Packages</a><a id="Available-Packages-1"></a><a class="docs-heading-anchor-permalink" href="#Available-Packages" title="Permalink"></a></h2><p>The POMDPs.jl package contains only the interface used for expressing and solving Markov decision processes (MDPs) and partially observable Markov decision processes (POMDPs). The <a href="POMDPTools/#pomdptools_section">POMDPTools</a> package acts as a &quot;standard library&quot; for the POMDPs.jl interface, providing implementations of commonly-used components such as policies, belief updaters, distributions, and simulators. 
The list of solver and support packages maintained by the <a href="https://github.com/JuliaPOMDP">JuliaPOMDP</a> community is available at the <a href="https://github.com/JuliaPOMDP/POMDPs.jl#supported-packages">POMDPs.jl Readme</a>.</p><h2 id="Documentation-Outline"><a class="docs-heading-anchor" href="#Documentation-Outline">Documentation Outline</a><a id="Documentation-Outline-1"></a><a class="docs-heading-anchor-permalink" href="#Documentation-Outline" title="Permalink"></a></h2><p>Documentation comes in three forms:</p><ol><li>An explanatory guide is available in the sections outlined below.</li><li>How-to examples are available throughout this documentation with specific examples in <a href="examples/#examples_section">Examples</a> and <a href="gallery/#Gallery-of-POMDPs.jl-Problems">Gallery of POMDPs.jl Problems</a>.</li><li>Reference docstrings for the entire POMDPs.jl interface are available in the <a href="api/#API-Documentation">API Documentation</a> section.</li></ol><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>When updating these documents, make sure this is synced with <a href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/make.jl">docs/make.jl</a>!!</p></div></div><h3 id="Basics"><a class="docs-heading-anchor" href="#Basics">Basics</a><a id="Basics-1"></a><a class="docs-heading-anchor-permalink" href="#Basics" title="Permalink"></a></h3><ul><li><a href="install/#Installation">Installation</a></li><li><a href="get_started/#Getting-Started">Getting Started</a></li><li><a href="concepts/#Concepts-and-Architecture">Concepts and Architecture</a></li><li class="no-marker"><ul><li><a href="concepts/#POMDPs-and-MDPs">POMDPs and MDPs</a></li><li><a href="concepts/#Beliefs-and-Updaters">Beliefs and Updaters</a></li><li><a href="concepts/#Solvers-and-Policies">Solvers and Policies</a></li><li><a href="concepts/#Simulators">Simulators</a></li></ul></li></ul><h3 
id="Defining-POMDP-Models"><a class="docs-heading-anchor" href="#Defining-POMDP-Models">Defining POMDP Models</a><a id="Defining-POMDP-Models-1"></a><a class="docs-heading-anchor-permalink" href="#Defining-POMDP-Models" title="Permalink"></a></h3><ul><li><a href="def_pomdp/#defining_pomdps">Defining POMDPs and MDPs</a></li><li class="no-marker"><ul><li><a href="def_pomdp/#tiger">A Basic Example: The Tiger POMDP</a></li><li><a href="def_pomdp/#Guide-to-Defining-POMDPs">Guide to Defining POMDPs</a></li><li class="no-marker"><ul><li><a href="def_pomdp/#po-mountaincar">A more complex example: A partially-observable mountain car</a></li><li><a href="def_pomdp/#space_representation">State, action, and observation spaces</a></li><li><a href="def_pomdp/#Transition-and-observation-distributions-2">Transition and observation distributions</a></li><li><a href="def_pomdp/#Reward-functions">Reward functions</a></li><li><a href="def_pomdp/#Other-Components">Other Components</a></li></ul></li><li><a href="def_pomdp/#Other-ways-to-define-a-(PO)MDP">Other ways to define a (PO)MDP</a></li><li class="no-marker"><ul><li><a href="def_pomdp/#Object-oriented">Object-oriented</a></li><li><a href="def_pomdp/#Using-a-single-generative-function-instead-of-separate-T,-Z,-and-R">Using a single generative function instead of separate <span>$T$</span>, <span>$Z$</span>, and <span>$R$</span></a></li><li><a href="def_pomdp/#Tabular">Tabular</a></li></ul></li></ul></li><li><a href="interfaces/#Spaces-and-Distributions">Spaces and Distributions</a></li><li class="no-marker"><ul><li><a href="interfaces/#space-interface">Spaces</a></li><li><a href="interfaces/#Distributions">Distributions</a></li></ul></li></ul><h3 id="Writing-Solvers-and-Updaters"><a class="docs-heading-anchor" href="#Writing-Solvers-and-Updaters">Writing Solvers and Updaters</a><a id="Writing-Solvers-and-Updaters-1"></a><a class="docs-heading-anchor-permalink" href="#Writing-Solvers-and-Updaters" 
title="Permalink"></a></h3><ul><li><a href="def_solver/#Solvers">Solvers</a></li><li class="no-marker"><ul><li><a href="def_solver/#Online-and-Offline-Solvers">Online and Offline Solvers</a></li><li><a href="def_solver/#Examples">Examples</a></li></ul></li><li><a href="offline_solver/#Example:-Defining-an-offline-solver">Example: Defining an offline solver</a></li><li><a href="online_solver/#Example:-Defining-an-online-solver">Example: Defining an online solver</a></li><li><a href="def_updater/#Defining-a-Belief-Updater">Defining a Belief Updater</a></li><li class="no-marker"><ul><li><a href="def_updater/#Defining-a-Belief-Type">Defining a Belief Type</a></li><li><a href="def_updater/#Defining-an-Updater">Defining an Updater</a></li></ul></li></ul><h3 id="Analyzing-Results"><a class="docs-heading-anchor" href="#Analyzing-Results">Analyzing Results</a><a id="Analyzing-Results-1"></a><a class="docs-heading-anchor-permalink" href="#Analyzing-Results" title="Permalink"></a></h3><ul><li><a href="simulation/#Simulation-Standard">Simulation Standard</a></li><li class="no-marker"><ul><li><a href="simulation/#POMDP-Simulation">POMDP Simulation</a></li><li><a href="simulation/#MDP-Simulation">MDP Simulation</a></li></ul></li><li><a href="run_simulation/#Running-Simulations">Running Simulations</a></li><li><a href="policy_interaction/#Interacting-with-Policies">Interacting with Policies</a></li></ul><h3 id="Examples-and-Gallery"><a class="docs-heading-anchor" href="#Examples-and-Gallery">Examples and Gallery</a><a id="Examples-and-Gallery-1"></a><a class="docs-heading-anchor-permalink" href="#Examples-and-Gallery" title="Permalink"></a></h3><ul><li><a href="examples/#examples_section">Examples</a></li><li class="no-marker"><ul><li><a href="examples/#Outline">Outline</a></li></ul></li><li><a href="example_defining_problems/#Defining-a-POMDP">Defining a POMDP</a></li><li class="no-marker"><ul><li><a href="example_defining_problems/#CryingBaby-Problem-Definition">CryingBaby 
Problem Definition</a></li><li><a href="example_defining_problems/#quick_crying">QuickPOMDP Interface</a></li><li><a href="example_defining_problems/#explicit_crying">Explicit Interface</a></li><li><a href="example_defining_problems/#gen_crying">Generative Interface</a></li><li><a href="example_defining_problems/#tab_crying">Probability Tables</a></li></ul></li><li><a href="example_solvers/#Using-Different-Solvers">Using Different Solvers</a></li><li class="no-marker"><ul><li><a href="example_solvers/#Checking-Requirements">Checking Requirements</a></li><li><a href="example_solvers/#Offline-(SARSOP)">Offline (SARSOP)</a></li><li><a href="example_solvers/#Online-(POMCP)">Online (POMCP)</a></li><li><a href="example_solvers/#Heuristic-Policy">Heuristic Policy</a></li></ul></li><li><a href="example_simulations/#Simulations-Examples">Simulations Examples</a></li><li class="no-marker"><ul><li><a href="example_simulations/#Stepthrough">Stepthrough</a></li><li><a href="example_simulations/#Rollout-Simulations">Rollout Simulations</a></li><li><a href="example_simulations/#Recording-Histories">Recording Histories</a></li><li><a href="example_simulations/#Parallel-Simulations">Parallel Simulations</a></li></ul></li><li><a href="example_gridworld_mdp/#GridWorld-MDP-Tutorial">GridWorld MDP Tutorial</a></li><li class="no-marker"><ul><li><a href="example_gridworld_mdp/#Dependencies">Dependencies</a></li><li><a href="example_gridworld_mdp/#Problem-Overview">Problem Overview</a></li><li><a href="example_gridworld_mdp/#Defining-the-Grid-World-MDP-Type">Defining the Grid World MDP Type</a></li><li><a href="example_gridworld_mdp/#Grid-World-State-Space">Grid World State Space</a></li><li><a href="example_gridworld_mdp/#Grid-World-Action-Space">Grid World Action Space</a></li><li><a href="example_gridworld_mdp/#Grid-World-Transition-Function">Grid World Transition Function</a></li><li><a href="example_gridworld_mdp/#Grid-World-Reward-Function">Grid World Reward Function</a></li><li><a 
href="example_gridworld_mdp/#Grid-World-Remaining-Functions">Grid World Remaining Functions</a></li><li><a href="example_gridworld_mdp/#Solving-the-Grid-World-MDP-(Value-Iteration)">Solving the Grid World MDP (Value Iteration)</a></li><li><a href="example_gridworld_mdp/#Solving-the-Grid-World-MDP-(MCTS)">Solving the Grid World MDP (MCTS)</a></li><li><a href="example_gridworld_mdp/#Visualizing-the-Value-Iteration-Policy">Visualizing the Value Iteration Policy</a></li><li><a href="example_gridworld_mdp/#Seeing-a-Policy-In-Action">Seeing a Policy In Action</a></li></ul></li><li><a href="gallery/#Gallery-of-POMDPs.jl-Problems">Gallery of POMDPs.jl Problems</a></li><li class="no-marker"><ul><li><a href="gallery/#[EscapeRoomba](https://github.com/sisl/AA228FinalProject)">EscapeRoomba</a></li><li><a href="gallery/#[DroneSurveillance](https://github.com/JuliaPOMDP/DroneSurveillance.jl)">DroneSurveillance</a></li><li><a href="gallery/#[QuickMountainCar](https://github.com/JuliaPOMDP/QuickPOMDPs.jl)">QuickMountainCar</a></li><li><a href="gallery/#[RockSample](https://github.com/JuliaPOMDP/RockSample.jl)">RockSample</a></li><li><a href="gallery/#[TagPOMDPProblem](https://github.com/JuliaPOMDP/TagPOMDPProblem.jl)">TagPOMDPProblem</a></li><li><a href="gallery/#Adding-New-Gallery-Examples">Adding New Gallery Examples</a></li></ul></li></ul><h3 id="POMDPTools-the-standard-library-for-POMDPs.jl"><a class="docs-heading-anchor" href="#POMDPTools-the-standard-library-for-POMDPs.jl">POMDPTools - the standard library for POMDPs.jl</a><a id="POMDPTools-the-standard-library-for-POMDPs.jl-1"></a><a class="docs-heading-anchor-permalink" href="#POMDPTools-the-standard-library-for-POMDPs.jl" title="Permalink"></a></h3><ul><li><a href="POMDPTools/#pomdptools_section">POMDPTools: the standard library for POMDPs.jl</a></li><li><a href="POMDPTools/distributions/#Implemented-Distributions">Implemented Distributions</a></li><li class="no-marker"><ul><li><a 
href="POMDPTools/distributions/#Sparse-Categorical-(SparseCat)">Sparse Categorical (<code>SparseCat</code>)</a></li><li><a href="POMDPTools/distributions/#Implicit">Implicit</a></li><li><a href="POMDPTools/distributions/#Bool-Distribution">Bool Distribution</a></li><li><a href="POMDPTools/distributions/#Deterministic">Deterministic</a></li><li><a href="POMDPTools/distributions/#Uniform">Uniform</a></li><li><a href="POMDPTools/distributions/#Pretty-Printing">Pretty Printing</a></li></ul></li><li><a href="POMDPTools/model/#Model-Tools">Model Tools</a></li><li class="no-marker"><ul><li><a href="POMDPTools/model/#Interface-Extensions">Interface Extensions</a></li><li><a href="POMDPTools/model/#Model-Transformations">Model Transformations</a></li><li><a href="POMDPTools/model/#Utility-Types">Utility Types</a></li></ul></li><li><a href="POMDPTools/visualization/#Visualization">Visualization</a></li><li><a href="POMDPTools/beliefs/#Implemented-Belief-Updaters">Implemented Belief Updaters</a></li><li class="no-marker"><ul><li><a href="POMDPTools/beliefs/#Discrete-(Bayesian-Filter)">Discrete (Bayesian Filter)</a></li><li><a href="POMDPTools/beliefs/#K-Previous-Observations">K Previous Observations</a></li><li><a href="POMDPTools/beliefs/#Previous-Observation">Previous Observation</a></li><li><a href="POMDPTools/beliefs/#Nothing-Updater">Nothing Updater</a></li></ul></li><li><a href="POMDPTools/policies/#Implemented-Policies">Implemented Policies</a></li><li class="no-marker"><ul><li><a href="POMDPTools/policies/#Function">Function</a></li><li><a href="POMDPTools/policies/#Alpha-Vector-Policy">Alpha Vector Policy</a></li><li><a href="POMDPTools/policies/#Random-Policy">Random Policy</a></li><li><a href="POMDPTools/policies/#Stochastic-Policies">Stochastic Policies</a></li><li><a href="POMDPTools/policies/#Vector-Policies">Vector Policies</a></li><li><a href="POMDPTools/policies/#Value-Dict-Policy">Value Dict Policy</a></li><li><a 
href="POMDPTools/policies/#Exploration-Policies">Exploration Policies</a></li><li><a href="POMDPTools/policies/#Playback-Policy">Playback Policy</a></li><li><a href="POMDPTools/policies/#Utility-Wrapper">Utility Wrapper</a></li><li><a href="POMDPTools/policies/#Pretty-Printing-Policies">Pretty Printing Policies</a></li></ul></li><li><a href="POMDPTools/policies/#Policy-Evaluation">Policy Evaluation</a></li><li><a href="POMDPTools/simulators/#Implemented-Simulators">Implemented Simulators</a></li><li class="no-marker"><ul><li><a href="POMDPTools/simulators/#which_simulator">Which Simulator Should I Use?</a></li><li><a href="POMDPTools/simulators/#Stepping-through">Stepping through</a></li><li><a href="POMDPTools/simulators/#Rollouts">Rollouts</a></li><li><a href="POMDPTools/simulators/#History-Recorder">History Recorder</a></li><li><a href="POMDPTools/simulators/#sim-function"><code>sim()</code></a></li><li><a href="POMDPTools/simulators/#Histories">Histories</a></li><li><a href="POMDPTools/simulators/#Parallel">Parallel</a></li><li><a href="POMDPTools/simulators/#Display">Display</a></li></ul></li><li><a href="POMDPTools/common_rl/#CommonRLInterface-Integration">CommonRLInterface Integration</a></li><li class="no-marker"><ul><li><a href="POMDPTools/common_rl/#Environment-Wrapper-Types">Environment Wrapper Types</a></li><li><a href="POMDPTools/common_rl/#Constructors">Constructors</a></li></ul></li><li><a href="POMDPTools/testing/#Testing">Testing</a></li><li class="no-marker"><ul><li><a href="POMDPTools/testing/#Testing-(PO)MDP-Models">Testing (PO)MDP Models</a></li><li><a href="POMDPTools/testing/#Testing-Solvers">Testing Solvers</a></li></ul></li></ul><h3 id="Reference"><a class="docs-heading-anchor" href="#Reference">Reference</a><a id="Reference-1"></a><a class="docs-heading-anchor-permalink" href="#Reference" title="Permalink"></a></h3><ul><li><a href="faq/#Frequently-Asked-Questions-(FAQ)">Frequently Asked Questions (FAQ)</a></li><li 
class="no-marker"><ul><li><a href="faq/#What-is-the-difference-between-transition,-gen,-and-@gen?">What is the difference between <code>transition</code>, <code>gen</code>, and <code>@gen</code>?</a></li><li><a href="faq/#How-do-I-save-my-policies?">How do I save my policies?</a></li><li><a href="faq/#Why-is-my-solver-producing-a-suboptimal-policy?">Why is my solver producing a suboptimal policy?</a></li><li><a href="faq/#What-if-I-don&#39;t-use-the-rng-argument?">What if I don&#39;t use the <code>rng</code> argument?</a></li><li><a href="faq/#Why-are-all-the-solvers-in-separate-modules?">Why are all the solvers in separate modules?</a></li><li><a href="faq/#How-can-I-implement-terminal-actions?">How can I implement terminal actions?</a></li><li><a href="faq/#Why-are-there-two-versions-of-reward?">Why are there two versions of <code>reward</code>?</a></li><li><a href="faq/#How-do-I-implement-reward(m,-s,-a)-if-the-reward-depends-on-the-next-state?">How do I implement <code>reward(m, s, a)</code> if the reward depends on the next state?</a></li><li><a href="faq/#Why-do-I-need-to-put-type-assertions-pomdp::POMDP-into-the-function-signature?">Why do I need to put type assertions pomdp::POMDP into the function signature?</a></li></ul></li><li><a href="api/#API-Documentation">API Documentation</a></li><li class="no-marker"><ul><li><a href="api/#Contents">Contents</a></li><li><a href="api/#Index">Index</a></li><li><a href="api/#Types">Types</a></li><li><a href="api/#Model-Functions">Model Functions</a></li><li><a href="api/#Belief-Functions">Belief Functions</a></li><li><a href="api/#Policy-and-Solver-Functions">Policy and Solver Functions</a></li><li><a href="api/#Simulator">Simulator</a></li></ul></li></ul></article><nav class="docs-footer"><a class="docs-footer-nextpage" href="install/">Installation »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a 
href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/install/index.html b/dev/install/index.html
index c2a75397..abc2ce52 100644
--- a/dev/install/index.html
+++ b/dev/install/index.html
@@ -1,3 +1,3 @@
 <!DOCTYPE html>
 <html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Installation · POMDPs.jl</title><meta name="title" content="Installation · POMDPs.jl"/><meta property="og:title" content="Installation · POMDPs.jl"/><meta property="twitter:title" content="Installation · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li class="is-active"><a class="tocitem" href>Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../def_updater/">Defining a 
Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div 
class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Basics</a></li><li class="is-active"><a href>Installation</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Installation</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/install.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Installation"><a class="docs-heading-anchor" href="#Installation">Installation</a><a id="Installation-1"></a><a class="docs-heading-anchor-permalink" href="#Installation" title="Permalink"></a></h1><p>If you have a running Julia distribution (Julia 0.4 or greater), you have everything you need to install POMDPs.jl. To install the package, simply run the following from the Julia REPL:</p><pre><code class="language-julia hljs">import Pkg
-Pkg.add(&quot;POMDPs&quot;) # installs the POMDPs.jl package</code></pre><p>Some auxiliary packages and older versions of solvers may be found in the JuliaPOMDP registry. To install this registry, run:</p><pre><code class="language-julia hljs">using Pkg; pkg&quot;registry add https://github.com/JuliaPOMDP/Registry&quot;</code></pre><p>Note: to use this registry, <a href="https://juliacomputing.com/products/juliapro">JuliaPro</a> users must also run <code>edit(normpath(Sys.BINDIR,&quot;..&quot;,&quot;etc&quot;,&quot;julia&quot;,&quot;startup.jl&quot;))</code>, comment out the line <code>ENV[&quot;DISABLE_FALLBACK&quot;] = &quot;true&quot;</code>, save the file, and restart JuliaPro as described in <a href="https://github.com/JuliaPOMDP/POMDPs.jl/issues/249">this issue</a>.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../">« POMDPs.jl</a><a class="docs-footer-nextpage" href="../get_started/">Getting Started »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a 
href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+Pkg.add(&quot;POMDPs&quot;) # installs the POMDPs.jl package</code></pre><p>Some auxiliary packages and older versions of solvers may be found in the JuliaPOMDP registry. To install this registry, run:</p><pre><code class="language-julia hljs">using Pkg; pkg&quot;registry add https://github.com/JuliaPOMDP/Registry&quot;</code></pre><p>Note: to use this registry, <a href="https://juliacomputing.com/products/juliapro">JuliaPro</a> users must also run <code>edit(normpath(Sys.BINDIR,&quot;..&quot;,&quot;etc&quot;,&quot;julia&quot;,&quot;startup.jl&quot;))</code>, comment out the line <code>ENV[&quot;DISABLE_FALLBACK&quot;] = &quot;true&quot;</code>, save the file, and restart JuliaPro as described in <a href="https://github.com/JuliaPOMDP/POMDPs.jl/issues/249">this issue</a>.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../">« POMDPs.jl</a><a class="docs-footer-nextpage" href="../get_started/">Getting Started »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a 
href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/interfaces/index.html b/dev/interfaces/index.html
index 965be55c..c5137070 100644
--- a/dev/interfaces/index.html
+++ b/dev/interfaces/index.html
@@ -1,2 +1,2 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Spaces and Distributions · POMDPs.jl</title><meta name="title" content="Spaces and Distributions · POMDPs.jl"/><meta property="og:title" content="Spaces and Distributions · POMDPs.jl"/><meta property="twitter:title" content="Spaces and Distributions · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link 
class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li class="is-active"><a class="tocitem" href>Spaces and Distributions</a><ul class="internal"><li><a class="tocitem" href="#space-interface"><span>Spaces</span></a></li><li><a class="tocitem" href="#Distributions"><span>Distributions</span></a></li></ul></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline 
solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions 
(FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Defining (PO)MDP Models</a></li><li class="is-active"><a href>Spaces and Distributions</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Spaces and Distributions</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/interfaces.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Spaces-and-Distributions"><a class="docs-heading-anchor" href="#Spaces-and-Distributions">Spaces and Distributions</a><a id="Spaces-and-Distributions-1"></a><a class="docs-heading-anchor-permalink" href="#Spaces-and-Distributions" title="Permalink"></a></h1><p>Two important components of the definitions of MDPs and POMDPs are <em>spaces</em>, which specify the possible 
states, actions, and observations in a problem and <em>distributions</em>, which define probability distributions. In order to provide for maximum flexibility spaces and distributions may be of any type (i.e. there are no abstract base types). Solvers and simulators will interact with space and distribution types using the functions defined below.</p><h2 id="space-interface"><a class="docs-heading-anchor" href="#space-interface">Spaces</a><a id="space-interface-1"></a><a class="docs-heading-anchor-permalink" href="#space-interface" title="Permalink"></a></h2><p>A space object should contain the information needed to define the set of all possible states, actions or observations. The implementation will depend on the attributes of the elements. For example, if the space is continuous, the space object may only contain the limits of the continuous range. In the case of a discrete problem, a vector containing all states is appropriate for representing a space.</p><p>The following functions may be called on a space object (Click on a function to read its documentation):</p><ul><li><a href="../api/#Base.rand"><code>rand</code></a></li><li><a href="https://docs.julialang.org/en/v1/manual/interfaces/#man-interface-iteration-1"><code>iterate</code></a> and <a href="https://docs.julialang.org/en/v1/manual/interfaces/#man-interface-iteration-1">the rest of the iteration interface</a> for discrete spaces.</li></ul><h2 id="Distributions"><a class="docs-heading-anchor" href="#Distributions">Distributions</a><a id="Distributions-1"></a><a class="docs-heading-anchor-permalink" href="#Distributions" title="Permalink"></a></h2><p>A distribution object represents a probability distribution.</p><p>The following functions may be called on a distribution object (Click on a function to read its documentation):</p><ul><li><a href="../api/#Base.rand"><code>rand</code></a><code>([rng,] d)</code> <sup class="footnote-reference"><a id="citeref-1" href="#footnote-1">[1]</a></sup></li><li><a 
href="../api/#Distributions.support"><code>support</code></a></li><li><a href="../api/#Distributions.pdf"><code>pdf</code></a></li><li><a href="../api/#StatsBase.mode"><code>mode</code></a></li><li><a href="../api/#Statistics.mean"><code>mean</code></a></li></ul><p>You can find some useful pre-made distribution objects in <a href="https://github.com/JuliaStats/Distributions.jl">Distributions.jl</a> or <a href="../POMDPTools/#pomdptools_section">POMDPTools</a>.</p><section class="footnotes is-size-7"><ul><li class="footnote" id="footnote-1"><a class="tag is-link" href="#citeref-1">1</a>Distributions should support both <code>rand(rng::AbstractRNG, d)</code> and <code>rand(d)</code>. The recommended way to do this is by implmenting <code>Base.rand(rng::AbstractRNG, s::Random.SamplerTrivial{&lt;:YourDistribution})</code> from the <a href="https://docs.julialang.org/en/v1/stdlib/Random/index.html#Generating-values-from-a-collection-1">julia rand interface</a>.</li></ul></section></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../def_pomdp/">« Defining POMDPs and MDPs</a><a class="docs-footer-nextpage" href="../def_solver/">Solvers »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option 
value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Spaces and Distributions · POMDPs.jl</title><meta name="title" content="Spaces and Distributions · POMDPs.jl"/><meta property="og:title" content="Spaces and Distributions · POMDPs.jl"/><meta property="twitter:title" content="Spaces and Distributions · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link 
class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li class="is-active"><a class="tocitem" href>Spaces and Distributions</a><ul class="internal"><li><a class="tocitem" href="#space-interface"><span>Spaces</span></a></li><li><a class="tocitem" href="#Distributions"><span>Distributions</span></a></li></ul></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline 
solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions 
(FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Defining (PO)MDP Models</a></li><li class="is-active"><a href>Spaces and Distributions</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Spaces and Distributions</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/interfaces.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Spaces-and-Distributions"><a class="docs-heading-anchor" href="#Spaces-and-Distributions">Spaces and Distributions</a><a id="Spaces-and-Distributions-1"></a><a class="docs-heading-anchor-permalink" href="#Spaces-and-Distributions" title="Permalink"></a></h1><p>Two important components of the definitions of MDPs and POMDPs are <em>spaces</em>, which specify the possible 
states, actions, and observations in a problem and <em>distributions</em>, which define probability distributions. In order to provide for maximum flexibility spaces and distributions may be of any type (i.e. there are no abstract base types). Solvers and simulators will interact with space and distribution types using the functions defined below.</p><h2 id="space-interface"><a class="docs-heading-anchor" href="#space-interface">Spaces</a><a id="space-interface-1"></a><a class="docs-heading-anchor-permalink" href="#space-interface" title="Permalink"></a></h2><p>A space object should contain the information needed to define the set of all possible states, actions or observations. The implementation will depend on the attributes of the elements. For example, if the space is continuous, the space object may only contain the limits of the continuous range. In the case of a discrete problem, a vector containing all states is appropriate for representing a space.</p><p>The following functions may be called on a space object (Click on a function to read its documentation):</p><ul><li><a href="../api/#Base.rand"><code>rand</code></a></li><li><a href="https://docs.julialang.org/en/v1/manual/interfaces/#man-interface-iteration-1"><code>iterate</code></a> and <a href="https://docs.julialang.org/en/v1/manual/interfaces/#man-interface-iteration-1">the rest of the iteration interface</a> for discrete spaces.</li></ul><h2 id="Distributions"><a class="docs-heading-anchor" href="#Distributions">Distributions</a><a id="Distributions-1"></a><a class="docs-heading-anchor-permalink" href="#Distributions" title="Permalink"></a></h2><p>A distribution object represents a probability distribution.</p><p>The following functions may be called on a distribution object (Click on a function to read its documentation):</p><ul><li><a href="../api/#Base.rand"><code>rand</code></a><code>([rng,] d)</code> <sup class="footnote-reference"><a id="citeref-1" href="#footnote-1">[1]</a></sup></li><li><a 
href="../api/#Distributions.support"><code>support</code></a></li><li><a href="../api/#Distributions.pdf"><code>pdf</code></a></li><li><a href="../api/#StatsBase.mode"><code>mode</code></a></li><li><a href="../api/#Statistics.mean"><code>mean</code></a></li></ul><p>You can find some useful pre-made distribution objects in <a href="https://github.com/JuliaStats/Distributions.jl">Distributions.jl</a> or <a href="../POMDPTools/#pomdptools_section">POMDPTools</a>.</p><section class="footnotes is-size-7"><ul><li class="footnote" id="footnote-1"><a class="tag is-link" href="#citeref-1">1</a>Distributions should support both <code>rand(rng::AbstractRNG, d)</code> and <code>rand(d)</code>. The recommended way to do this is by implementing <code>Base.rand(rng::AbstractRNG, s::Random.SamplerTrivial{&lt;:YourDistribution})</code> from the <a href="https://docs.julialang.org/en/v1/stdlib/Random/index.html#Generating-values-from-a-collection-1">julia rand interface</a>.</li></ul></section></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../def_pomdp/">« Defining POMDPs and MDPs</a><a class="docs-footer-nextpage" href="../def_solver/">Solvers »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option 
value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/offline_solver/index.html b/dev/offline_solver/index.html
index dd8922ec..6b5fe88a 100644
--- a/dev/offline_solver/index.html
+++ b/dev/offline_solver/index.html
@@ -70,4 +70,4 @@
 
 @assert action(policy, Deterministic(TIGER_LEFT)) == TIGER_OPEN_RIGHT
 @assert action(policy, Deterministic(TIGER_RIGHT)) == TIGER_OPEN_LEFT
-@assert action(policy, Uniform(states(tiger))) == TIGER_LISTEN</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../def_solver/">« Solvers</a><a class="docs-footer-nextpage" href="../online_solver/">Example: Defining an online solver »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+@assert action(policy, Uniform(states(tiger))) == TIGER_LISTEN</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../def_solver/">« Solvers</a><a class="docs-footer-nextpage" href="../online_solver/">Example: Defining an online solver »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/online_solver/index.html b/dev/online_solver/index.html
index f88bfaa6..e9ba07b2 100644
--- a/dev/online_solver/index.html
+++ b/dev/online_solver/index.html
@@ -56,4 +56,4 @@
 
 @assert action(planner, Deterministic(TIGER_LEFT)) == TIGER_OPEN_RIGHT
 @assert action(planner, Deterministic(TIGER_RIGHT)) == TIGER_OPEN_LEFT
-# note action(planner, Uniform(states(tiger))) is not very reliable with this number of samples</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../offline_solver/">« Example: Defining an offline solver</a><a class="docs-footer-nextpage" href="../def_updater/">Defining a Belief Updater »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+# note action(planner, Uniform(states(tiger))) is not very reliable with this number of samples</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../offline_solver/">« Example: Defining an offline solver</a><a class="docs-footer-nextpage" href="../def_updater/">Defining a Belief Updater »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/policy_interaction/index.html b/dev/policy_interaction/index.html
index 4bb17a4c..58b9a121 100644
--- a/dev/policy_interaction/index.html
+++ b/dev/policy_interaction/index.html
@@ -1,2 +1,2 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Interacting with Policies · POMDPs.jl</title><meta name="title" content="Interacting with Policies · POMDPs.jl"/><meta property="og:title" content="Interacting with Policies · POMDPs.jl"/><meta property="twitter:title" content="Interacting with Policies · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link 
class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a 
class="tocitem" href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li class="is-active"><a class="tocitem" href>Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button 
is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Analyzing Results</a></li><li class="is-active"><a href>Interacting with Policies</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Interacting with Policies</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/policy_interaction.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Interacting-with-Policies"><a class="docs-heading-anchor" href="#Interacting-with-Policies">Interacting with Policies</a><a id="Interacting-with-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Interacting-with-Policies" title="Permalink"></a></h1><p>A solution to a POMDP is a policy that maps beliefs or action-observation histories to actions. In POMDPs.jl, these are represented by <a href="../api/#POMDPs.Policy"><code>Policy</code></a> objects. 
See <a href="../concepts/#Solvers-and-Policies">Solvers and Policies</a> for more information about what a policy can represent in general.</p><p>One common task in evaluating POMDP solutions is examining the policies themselves. Since the internal representation of a policy is an esoteric implementation detail, it is best to interact with policies through the <code>action</code> and <code>value</code> interface functions. There are three relevant methods</p><ul><li><a href="../api/#POMDPs.action"><code>action(policy, s)</code></a> returns the best action (or one of the best) for the given state or belief.</li><li><a href="../api/#POMDPs.value"><code>value(policy, s)</code></a> returns the expected sum of future rewards if the policy is executed.</li><li><a href="../api/#POMDPs.value"><code>value(policy, s, a)</code></a> returns the &quot;Q-value&quot;, that is, the expected sum of rewards if action a is taken on the next step and then the policy is executed.</li></ul><p>Note that the quantities returned by these functions are what the policy/solver expects to be the case after its (usually approximate) computations; they may be far from the true value if the solution is not exactly optimal.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../run_simulation/">« Running Simulations</a><a class="docs-footer-nextpage" href="../examples/">Examples »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option 
value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Interacting with Policies · POMDPs.jl</title><meta name="title" content="Interacting with Policies · POMDPs.jl"/><meta property="og:title" content="Interacting with Policies · POMDPs.jl"/><meta property="twitter:title" content="Interacting with Policies · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link 
class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a 
class="tocitem" href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li><a class="tocitem" href="../run_simulation/">Running Simulations</a></li><li class="is-active"><a class="tocitem" href>Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button 
is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Analyzing Results</a></li><li class="is-active"><a href>Interacting with Policies</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Interacting with Policies</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/policy_interaction.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Interacting-with-Policies"><a class="docs-heading-anchor" href="#Interacting-with-Policies">Interacting with Policies</a><a id="Interacting-with-Policies-1"></a><a class="docs-heading-anchor-permalink" href="#Interacting-with-Policies" title="Permalink"></a></h1><p>A solution to a POMDP is a policy that maps beliefs or action-observation histories to actions. In POMDPs.jl, these are represented by <a href="../api/#POMDPs.Policy"><code>Policy</code></a> objects. 
See <a href="../concepts/#Solvers-and-Policies">Solvers and Policies</a> for more information about what a policy can represent in general.</p><p>One common task in evaluating POMDP solutions is examining the policies themselves. Since the internal representation of a policy is an esoteric implementation detail, it is best to interact with policies through the <code>action</code> and <code>value</code> interface functions. There are three relevant methods</p><ul><li><a href="../api/#POMDPs.action"><code>action(policy, s)</code></a> returns the best action (or one of the best) for the given state or belief.</li><li><a href="../api/#POMDPs.value"><code>value(policy, s)</code></a> returns the expected sum of future rewards if the policy is executed.</li><li><a href="../api/#POMDPs.value"><code>value(policy, s, a)</code></a> returns the &quot;Q-value&quot;, that is, the expected sum of rewards if action a is taken on the next step and then the policy is executed.</li></ul><p>Note that the quantities returned by these functions are what the policy/solver expects to be the case after its (usually approximate) computations; they may be far from the true value if the solution is not exactly optimal.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../run_simulation/">« Running Simulations</a><a class="docs-footer-nextpage" href="../examples/">Examples »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option 
value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/run_simulation/index.html b/dev/run_simulation/index.html
index 113fb201..b4539b1f 100644
--- a/dev/run_simulation/index.html
+++ b/dev/run_simulation/index.html
@@ -1,3 +1,3 @@
 <!DOCTYPE html>
 <html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Running Simulations · POMDPs.jl</title><meta name="title" content="Running Simulations · POMDPs.jl"/><meta property="og:title" content="Running Simulations · POMDPs.jl"/><meta property="twitter:title" content="Running Simulations · POMDPs.jl"/><meta name="description" content="Documentation for POMDPs.jl."/><meta property="og:description" content="Documentation for POMDPs.jl."/><meta property="twitter:description" content="Documentation for POMDPs.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" 
rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../"><img src="../assets/logo.png" alt="POMDPs.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../">POMDPs.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><span class="tocitem">Basics</span><ul><li><a class="tocitem" href="../">POMDPs.jl</a></li><li><a class="tocitem" href="../install/">Installation</a></li><li><a class="tocitem" href="../get_started/">Getting Started</a></li><li><a class="tocitem" href="../concepts/">Concepts and Architecture</a></li></ul></li><li><span class="tocitem">Defining (PO)MDP Models</span><ul><li><a class="tocitem" href="../def_pomdp/">Defining POMDPs and MDPs</a></li><li><a class="tocitem" href="../interfaces/">Spaces and Distributions</a></li></ul></li><li><span class="tocitem">Writing Solvers</span><ul><li><a class="tocitem" href="../def_solver/">Solvers</a></li><li><a class="tocitem" href="../offline_solver/">Example: Defining an offline solver</a></li><li><a class="tocitem" href="../online_solver/">Example: Defining an online solver</a></li></ul></li><li><span class="tocitem">Writing Belief Updaters</span><ul><li><a class="tocitem" 
href="../def_updater/">Defining a Belief Updater</a></li></ul></li><li><span class="tocitem">Analyzing Results</span><ul><li><a class="tocitem" href="../simulation/">Simulation Standard</a></li><li class="is-active"><a class="tocitem" href>Running Simulations</a></li><li><a class="tocitem" href="../policy_interaction/">Interacting with Policies</a></li></ul></li><li><span class="tocitem">Examples and Gallery</span><ul><li><a class="tocitem" href="../examples/">Examples</a></li><li><a class="tocitem" href="../example_defining_problems/">Defining a POMDP</a></li><li><a class="tocitem" href="../example_solvers/">Using Different Solvers</a></li><li><a class="tocitem" href="../example_simulations/">Simulations Examples</a></li><li><a class="tocitem" href="../example_gridworld_mdp/">GridWorld MDP Tutorial</a></li><li><a class="tocitem" href="../gallery/">Gallery of POMDPs.jl Problems</a></li></ul></li><li><span class="tocitem">POMDPTools</span><ul><li><a class="tocitem" href="../POMDPTools/">POMDPTools: the standard library for POMDPs.jl</a></li><li><a class="tocitem" href="../POMDPTools/distributions/">Implemented Distributions</a></li><li><a class="tocitem" href="../POMDPTools/model/">Model Tools</a></li><li><a class="tocitem" href="../POMDPTools/visualization/">Visualization</a></li><li><a class="tocitem" href="../POMDPTools/beliefs/">Implemented Belief Updaters</a></li><li><a class="tocitem" href="../POMDPTools/policies/">Implemented Policies</a></li><li><a class="tocitem" href="../POMDPTools/simulators/">Implemented Simulators</a></li><li><a class="tocitem" href="../POMDPTools/common_rl/">CommonRLInterface Integration</a></li><li><a class="tocitem" href="../POMDPTools/testing/">Testing</a></li></ul></li><li><a class="tocitem" href="../faq/">Frequently Asked Questions (FAQ)</a></li><li><a class="tocitem" href="../api/">API Documentation</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static 
is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">Analyzing Results</a></li><li class="is-active"><a href>Running Simulations</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Running Simulations</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaPOMDP/POMDPs.jl/blob/master/docs/src/run_simulation.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Running-Simulations"><a class="docs-heading-anchor" href="#Running-Simulations">Running Simulations</a><a id="Running-Simulations-1"></a><a class="docs-heading-anchor-permalink" href="#Running-Simulations" title="Permalink"></a></h1><p>Running a simulation consists of two steps, creating a simulator and calling the <a href="../api/#POMDPs.simulate"><code>simulate</code></a> function. 
For example, given a POMDP or MDP model <code>m</code>, and a policy <code>p</code>, one can use the <a href="../POMDPTools/simulators/#POMDPTools.Simulators.RolloutSimulator"><code>RolloutSimulator</code></a> from <a href="../POMDPTools/#pomdptools_section">POMDPTools</a> to find the accumulated discounted reward from a single simulated trajectory as follows:</p><pre><code class="language-julia hljs">sim = RolloutSimulator()
-r = simulate(sim, m, p)</code></pre><p>More inputs, such as a belief updater, initial state, initial belief, etc. may be specified as arguments to <a href="../api/#POMDPs.simulate"><code>simulate</code></a>. See the docstring for <a href="../api/#POMDPs.simulate"><code>simulate</code></a> and the appropriate &quot;Input&quot; sections in the <a href="../simulation/#Simulation-Standard">Simulation Standard</a> page for more information.</p><p>More examples can be found in the <a href="../example_simulations/#Simulations-Examples">Simulations Examples</a> section. A variety of simulators that return more information and interact in different ways can be found in <a href="../POMDPTools/#pomdptools_section">POMDPTools</a>.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../simulation/">« Simulation Standard</a><a class="docs-footer-nextpage" href="../policy_interaction/">Interacting with Policies »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a 
href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+r = simulate(sim, m, p)</code></pre><p>More inputs, such as a belief updater, initial state, initial belief, etc. may be specified as arguments to <a href="../api/#POMDPs.simulate"><code>simulate</code></a>. See the docstring for <a href="../api/#POMDPs.simulate"><code>simulate</code></a> and the appropriate &quot;Input&quot; sections in the <a href="../simulation/#Simulation-Standard">Simulation Standard</a> page for more information.</p><p>More examples can be found in the <a href="../example_simulations/#Simulations-Examples">Simulations Examples</a> section. A variety of simulators that return more information and interact in different ways can be found in <a href="../POMDPTools/#pomdptools_section">POMDPTools</a>.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../simulation/">« Simulation Standard</a><a class="docs-footer-nextpage" href="../policy_interaction/">Interacting with Policies »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a 
href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/simulation/index.html b/dev/simulation/index.html
index cd8f1738..86de561c 100644
--- a/dev/simulation/index.html
+++ b/dev/simulation/index.html
@@ -21,4 +21,4 @@
     d *= discount(mdp)
 end</code></pre><p>In terms of the explicit interface, the <a href="../api/#POMDPs.@gen"><code>@gen</code></a> macro above expands to the equivalent of:</p><pre><code class="language-julia hljs">    sp = rand(transition(pomdp, s, a))
     r = reward(pomdp, s, a, sp)
-    s = sp</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../def_updater/">« Defining a Belief Updater</a><a class="docs-footer-nextpage" href="../run_simulation/">Running Simulations »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:14">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+    s = sp</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../def_updater/">« Defining a Belief Updater</a><a class="docs-footer-nextpage" href="../run_simulation/">Running Simulations »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.5.0 on <span class="colophon-date" title="Friday 12 July 2024 21:57">Friday 12 July 2024</span>. Using Julia version 1.10.4.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>

Row	policy	mean	ci
	String?	Float64	Float64
1	sarsop	-14.6264	1.81814
2	pomcp	-18.6904	1.57649
3	heuristic	-15.4895	1.96535
4	random	-30.4201	2.64208