{
    "env_name": "reacher-goal-sparse",
    "n_train_tasks": 80,
    "n_eval_tasks": 20,
    "env_params": {
        "n_tasks": 100
    },
    "algo_params": {
        "num_iterations": 360,
        "num_initial_steps": 128,
        "num_tasks_sample": 10,
        "num_steps_prior": 128,
        "num_steps_posterior": 128,
        "num_extra_rl_steps_posterior": 128,
        "num_train_steps_per_itr": 1000,
        "num_steps_per_eval": 128,
        "embedding_batch_size": 64,
        "embedding_mini_batch_size": 64,
        "batch_size": 64,
        "max_path_length": 64,
        "discount": 0.90,
        "reward_scale": 100.0,
        "sparse_rewards": 0,
        "kl_lambda": 1e-0,
        "dump_eval_paths":1,
        "snail": 1,
        "meta_episode_len": 1,
        "num_trajs" : 2,
        "num_trajs_init": 2,
        "use_all_trajs": 1,
        "last_reward_only": 0,
        "intrinsic_reward_weight": 0.1,
        "use_kl_div_intrinsic": 0,
        "use_per": 0,
        "alpha": 1,
        "beta": 1,
        "reward_bias": 1e-1,
        "reward_decay": 0.6,
        "eval_deterministic":1,
        "gradient_from_Q": 1,
        "prediction_reward_scale": 10,
        "rsample_rate": 2,
        "rsample_rate_eval": 2
    },
    "util_params": {
        "base_log_dir":"outputmetacure"

    }
}
