3, [s0, s1, s2]
3, [e0, e1, e2]
3, [a0, a1, a2]
2, [o0, o1]

29, [pt_0.0.0, pt_0.0.1, pt_0.0.2, pt_0.1.0, pt_0.1.1, pt_0.1.2, pt_0.2.0, pt_0.2.1, pt_0.2.2, pt_1.0.0, pt_1.0.1, pt_1.0.2, pt_1.1.0, pt_1.1.1, pt_1.1.2, pt_1.2.0, pt_1.2.1, pt_1.2.2, pt_2.0.0, pt_2.0.1, pt_2.0.2, pt_2.1.0, pt_2.1.1, pt_2.1.2, pt_2.2.0, pt_2.2.1, pt_2.2.2, pt_1.0, pt_1.1]
[0.75, 0.15, 0.1, 0.0, 0.95, 0.05, 0.95, 0.05, 0.0, 0.75, 0.15, 0.1, 0.0, 0.95, 0.05, 0.95, 0.05, 0.0, 0.0, 0.95, 0.05, 0.95, 0.05, 0.0, 0.75, 0.15, 0.1, 0.6, 0.4]
[0.95, 0.05, 0.0, 0.0, 0.95, 0.05, 0.75, 0.15, 0.1, 0.0, 0.95, 0.05, 0.95, 0.05, 0.0, 0.75, 0.15, 0.1, 0.95, 0.05, 0.0, 0.75, 0.15, 0.1, 0.0, 0.95, 0.05, 0.15, 0.85]
[0.75, 0.15, 0.1, 0.95, 0.05, 0.0, 0.0, 0.95, 0.05, 0.0, 0.95, 0.05, 0.95, 0.05, 0.0, 0.75, 0.15, 0.1, 0.75, 0.15, 0.1, 0.95, 0.05, 0.0, 0.0, 0.95, 0.05, 0.35, 0.65]

# Transition function (s,a,s -> p)
0,0,0 -> pt_0.0.0
0,0,1 -> pt_0.0.1
0,0,2 -> pt_0.0.2
0,1,0 -> pt_0.1.0
0,1,1 -> pt_0.1.1
0,1,2 -> pt_0.1.2
0,2,0 -> pt_0.2.0
0,2,1 -> pt_0.2.1
0,2,2 -> pt_0.2.2
1,0,0 -> pt_1.0.0
1,0,1 -> pt_1.0.1
1,0,2 -> pt_1.0.2
1,1,0 -> pt_1.1.0
1,1,1 -> pt_1.1.1
1,1,2 -> pt_1.1.2
1,2,0 -> pt_1.2.0
1,2,1 -> pt_1.2.1
1,2,2 -> pt_1.2.2
2,0,0 -> pt_2.0.0
2,0,1 -> pt_2.0.1
2,0,2 -> pt_2.0.2
2,1,0 -> pt_2.1.0
2,1,1 -> pt_2.1.1
2,1,2 -> pt_2.1.2
2,2,0 -> pt_2.2.0
2,2,1 -> pt_2.2.1
2,2,2 -> pt_2.2.2

# Observation function (a,s,o -> p)
_,0,0 -> 1
_,1,0 -> pt_1.0
_,1,1 -> pt_1.1
_,2,1 -> 1

# Reward function (s,a -> r)
0,0 -> 0
0,1 -> -5
0,2 -> -5
1,0 -> 5
1,1 -> 0
1,2 -> 0
2,0 -> 10
2,1 -> 5
2,2 -> 5

# Initial beliefs (s -> p)
0 -> 1