In [1]:
using POMDPModels
using POMCP
import POMDPs
import POMDPToolbox: PreviousObservationUpdater
import POMCP.init_V
import POMDPs.action
problem = POMDPModels.BabyPOMDP(-5, -10)
rng = MersenneTwister(1)
solver = POMCPSolver(estimate_value=RolloutEstimator(POMDPModels.FeedWhenCrying()),
eps=0.01,
c=10.0,
tree_queries=20,
rng=rng,
node_belief_updater=POMDPs.updater(problem))
policy = POMDPs.solve(solver, problem)
b = RootNode(0, POMDPModels.BoolDistribution(0.0), Dict{Any,POMCP.ActNode}())
a = action(policy, b)
Out[1]:
In [2]:
# click on the nodes to expand them
POMCPTreeVisualizer(b)
Out[2]:
In [ ]: