Commit d8733c36 authored by Steven Cordwell
Browse files

finish docstring example of PolicyIterationModified

parent 4bc83923
...@@ -778,9 +778,9 @@ class PolicyIterationModified(PolicyIteration): ...@@ -778,9 +778,9 @@ class PolicyIterationModified(PolicyIteration):
>>> pim = mdptoolbox.mdp.PolicyIterationModified(P, R, 0.9) >>> pim = mdptoolbox.mdp.PolicyIterationModified(P, R, 0.9)
>>> pim.run() >>> pim.run()
>>> pim.policy >>> pim.policy
FIXME (0, 0, 0)
>>> pim.V >>> pim.V
FIXME (21.81408652334702, 25.054086523347017, 29.054086523347017)
""" """
...@@ -812,7 +812,7 @@ class PolicyIterationModified(PolicyIteration): ...@@ -812,7 +812,7 @@ class PolicyIterationModified(PolicyIteration):
self.V = zeros((self.S, 1)) self.V = zeros((self.S, 1))
else: else:
Rmin = min(R.min() for R in self.R) Rmin = min(R.min() for R in self.R)
self.V = 1 / (1 - discount) * Rmin * ones((self.S,)) self.V = 1 / (1 - self.discount) * Rmin * ones((self.S,))
# Call the iteration method # Call the iteration method
#self.run() #self.run()
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment