; Selects the environment definition used by the run.
; NOTE(review): the value looks like either a dotted module path or a path to
; a ".env" file; confirm against the code that reads this key.
[ENV]
; Alternative environment, kept for quick switching: uncomment this line and
; comment out the active FILE below. Keep exactly one FILE key active, since
; duplicate-key handling depends on the parser.
;FILE = environments.mtd_web_apps.env
FILE = environments.mtd_web_apps_stochastic.env

; Tunable numeric settings for the run (HP presumably = hyperparameters).
[HP]
; Epsilon for exploration, configured separately via the _D and _A keys.
; NOTE(review): _D / _A presumably denote two agents (e.g. defender and
; attacker); confirm against the code that reads them.
EPS_D = 0.15
EPS_A = 0.15

; Discount factor
; A single value is shared by both sides: GAMMA = GAMMA_D = GAMMA_A
GAMMA = 0.8

; Learning rate
ALPHA = 0.06

; Number of episodes, and number of steps within each episode
EPISODES = 101
STEPS_PER_EPISODE = 40

; Number of trials to plot rewards with variance
NUM_TRIALS = 6