# This benchmark does not work as I thought, please ignore...

using POMDPs, Distributions, IntervalArithmetic
export CupsAndBall

struct CupState 
    ball_location::Int
    phase::Int # peek, pick_ reshuffle, pick, sink
end

@kwdef mutable struct CupsGame <: IPOMDP{String, Int, Int} 
    discount::Float64    = 0.9999
    pickBall::Interval  = [interval(0.01,0.99)]
    init_probs::Vector{Interval}  = [1/3, 1/3, 1/3]
end

POMDPs.states(M::CupsGame) = [
    CupState(1,1), CupState(1,2), CupState(1,3),
    CupState(2,1), CupState(2,2), CupState(2,3),
    CupState(3,1), CupState(3,2), CupState(3,3),
    CupState(0,4)]
POMDPs.statetype(M::CupsGame) = String
POMDPs.stateindex(M::CupsGame, s) = findfirst(states(M) .== s)
POMDPs.actions(M::CupsGame) = [1,2,3] # pick ball
POMDPs.actiontype(M::CupsGame) = Int
POMDPs.actionindex(M::CupsGame, a) = a
POMDPs.observations(M::CupsGame) = [true, false] # observed ball, not observed ball
POMDPs.obstype(M::CupsGame) = Bool
POMDPs.obsindex(M::CupsGame, o) = o ? 1 : 2
POMDPs.discount(M::CupsGame) = M.discount
POMDPs.initialstate(M::CupsGame) = SparseCat(["shuffle_1","shuffle_2","shuffle_3"], M.init_probs)
POMDPs.isterminal(M::CupsGame, s) = s=="sink"


function POMDPs.transition(M::CupsGame, s,a)
    s.phase in [3,4] && return CupState(0,4)
    s.phase == 1 && return CupState(s.ball_location, 2)
    # if s.
    #...



    
end