Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
Zahra Rajabi
pymdptoolbox
Commits
d273f3a6
Commit
d273f3a6
authored
May 21, 2013
by
Steven Cordwell
Browse files
move all sqlite code to mdpsql.py and remove SQLite from class names
parent
7857e073
Changes
2
Hide whitespace changes
Inline
Side-by-side
mdp.py
View file @
d273f3a6
...
...
@@ -92,16 +92,13 @@ http://www.inra.fr/mia/T/MDPtoolbox/.
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
# POSSIBILITY OF SUCH DAMAGE.
import
sqlite3
import
os
from
math
import
ceil
,
log
,
sqrt
from
random
import
random
from
time
import
time
from
numpy
import
absolute
,
arange
,
array
,
diag
,
empty
,
matrix
,
mean
,
mod
from
numpy
import
absolute
,
array
,
diag
,
empty
,
matrix
,
mean
,
mod
from
numpy
import
multiply
,
ndarray
,
ones
,
zeros
from
numpy.random
import
permutation
,
rand
,
randint
from
numpy.random
import
rand
,
randint
from
scipy.sparse
import
csr_matrix
as
sparse
# __all__ = ["check", "checkSquareStochastic"]
...
...
@@ -496,7 +493,7 @@ def exampleForest(S=3, r1=4, r2=2, p=0.1):
# we want to return the generated transition and reward matrices
return
(
P
,
R
)
def
exampleRand
(
S
,
A
,
is_sparse
=
False
,
is_sqlite
=
False
,
mask
=
None
):
def
exampleRand
(
S
,
A
,
is_sparse
=
False
,
mask
=
None
):
"""Generate a random Markov Decision Process.
Parameters
...
...
@@ -543,44 +540,7 @@ def exampleRand(S, A, is_sparse=False, is_sqlite=False, mask=None):
except
AttributeError
:
raise
TypeError
(
mdperr
[
"mask_numpy"
])
# generate the transition and reward matrices based on S, A and mask
if
is_sqlite
:
# to be usefully represented as a sparse matrix, the number of nonzero
# entries should be less than 1/3 of dimesion of the matrix, so (SxS)/3
db
=
"MDP.db"
if
os
.
path
.
exists
(
db
):
raise
StandardError
(
"Database already exists, not overwriting. "
\
"Delete '"
+
db
+
"' if you want to continue."
)
else
:
conn
=
sqlite3
.
connect
(
db
)
with
conn
:
c
=
conn
.
cursor
()
cmd
=
'''
CREATE TABLE info (name TEXT, value INTEGER);
INSERT INTO info VALUES('states', %s);
INSERT INTO info VALUES('actions', %s);'''
%
(
S
,
A
)
c
.
executescript
(
cmd
)
for
a
in
range
(
A
):
cmd
=
'''
CREATE TABLE transition%s (row INTEGER, col INTEGER, prob REAL);
CREATE TABLE reward%s (state INTEGER PRIMARY KEY ASC, val REAL);'''
%
(
a
,
a
)
c
.
executescript
(
cmd
)
cmd
=
"INSERT INTO reward%s(val) VALUES(?)"
%
a
c
.
executemany
(
cmd
,
zip
(
rand
(
S
).
tolist
()))
for
s
in
xrange
(
S
):
n
=
randint
(
1
,
S
//
3
)
# timeit [90894] * 20330
# ==> 10000 loops, best of 3: 141 us per loop
# timeit (90894*np.ones(20330, dtype=int)).tolist()
# ==> 1000 loops, best of 3: 548 us per loop
col
=
(
permutation
(
arange
(
S
))[
0
:
n
]).
tolist
()
val
=
rand
(
n
)
val
=
(
val
/
val
.
sum
()).
tolist
()
cmd
=
"INSERT INTO transition%s VALUES(?, ?, ?)"
%
a
c
.
executemany
(
cmd
,
zip
([
s
]
*
n
,
col
,
val
))
cmd
=
"CREATE UNIQUE INDEX Pidx%s ON transition%s (row, col);"
%
(
a
,
a
)
c
.
execute
(
cmd
)
return
elif
is_sparse
:
if
is_sparse
:
# definition of transition matrix : square stochastic matrix
P
=
empty
(
A
,
dtype
=
object
)
# definition of reward matrix (values between -1 and +1)
...
...
mdpsql.py
View file @
d273f3a6
# -*- coding: utf-8 -*-
import
os
import
sqlite3
from
time
import
time
class
MDPSQLite
(
object
):
from
numpy
import
arange
from
numpy.random
import
permutation
,
rand
,
randint
def
exampleRand
(
S
,
A
):
# to be usefully represented as a sparse matrix, the number of nonzero
# entries should be less than 1/3 of dimesion of the matrix, so (SxS)/3
db
=
"MDP-%sx%s.db"
%
(
S
,
A
)
if
os
.
path
.
exists
(
db
):
os
.
remove
(
db
)
conn
=
sqlite3
.
connect
(
db
)
with
conn
:
c
=
conn
.
cursor
()
cmd
=
'''
CREATE TABLE info (name TEXT, value INTEGER);
INSERT INTO info VALUES('states', %s);
INSERT INTO info VALUES('actions', %s);'''
%
(
S
,
A
)
c
.
executescript
(
cmd
)
for
a
in
range
(
A
):
cmd
=
'''
CREATE TABLE transition%s (row INTEGER, col INTEGER, prob REAL);
CREATE TABLE reward%s (state INTEGER PRIMARY KEY ASC, val REAL);'''
%
(
a
,
a
)
c
.
executescript
(
cmd
)
cmd
=
"INSERT INTO reward%s(val) VALUES(?)"
%
a
c
.
executemany
(
cmd
,
zip
(
rand
(
S
).
tolist
()))
for
s
in
xrange
(
S
):
n
=
randint
(
1
,
S
//
3
)
# timeit [90894] * 20330
# ==> 10000 loops, best of 3: 141 us per loop
# timeit (90894*np.ones(20330, dtype=int)).tolist()
# ==> 1000 loops, best of 3: 548 us per loop
col
=
(
permutation
(
arange
(
S
))[
0
:
n
]).
tolist
()
val
=
rand
(
n
)
val
=
(
val
/
val
.
sum
()).
tolist
()
cmd
=
"INSERT INTO transition%s VALUES(?, ?, ?)"
%
a
c
.
executemany
(
cmd
,
zip
([
s
]
*
n
,
col
,
val
))
cmd
=
"CREATE UNIQUE INDEX Pidx%s ON transition%s (row, col);"
%
(
a
,
a
)
c
.
execute
(
cmd
)
return
class
MDP
(
object
):
""""""
def
__init__
(
self
,
db
,
discount
,
epsilon
,
max_iter
,
initial_V
=
0
):
...
...
@@ -166,12 +206,12 @@ class MDPSQLite(object):
self
.
_cur
.
executemany
(
cmd
,
zip
(
state
,
action
,
value
))
self
.
_conn
.
commit
()
class
ValueIteration
SQLite
(
MDPSQLite
):
class
ValueIteration
(
MDP
):
""""""
def
__init__
(
self
,
db
,
discount
,
epsilon
=
0.01
,
max_iter
=
1000
,
initial_value
=
0
):
MDP
SQLite
.
__init__
(
self
,
db
,
discount
,
epsilon
,
max_iter
,
initial_value
)
MDP
.
__init__
(
self
,
db
,
discount
,
epsilon
,
max_iter
,
initial_value
)
if
self
.
discount
<
1
:
self
.
thresh
=
epsilon
*
(
1
-
self
.
discount
)
/
self
.
discount
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment