{
    "env_name": "cheetah-vel-sparse",
    "n_train_tasks": 100,
    "n_eval_tasks": 30,
    "latent_size": 2,
    "env_params": {
        "n_tasks": 130
    },
    "algo_params": {
        "num_iterations": 5000,
        "num_initial_steps": 256,
        "num_steps_prior": 256,
        "num_steps_posterior": 0,
        "num_extra_rl_steps_posterior": 256,
        "num_evals": 1,
        "num_train_steps_per_itr": 1000,
        "num_steps_per_eval": 128,
        "embedding_batch_size": 64,
        "embedding_mini_batch_size": 64,
        "batch_size": 64,
        "max_path_length": 64,
        "kl_lambda": 1e-3,
        "dump_eval_paths":1,
        "snail": 1,
        "meta_episode_len": 1,
        "num_trajs" : 2,
        "num_trajs_init": 3,
        "policy_lr": 3e-4,
        "qf_lr": 3e-4,
        "vf_lr": 3e-4,
        "context_lr": 3e-4,
        "gradient_from_Q": 1,
        "prediction": 0,
        "reward_scale": 10,
        "eval_deterministic": 1,
        "sparse_rewards": 0,

        "last_reward_only": 0,
        "intrinsic_reward_weight": 0.2,
        "use_kl_div_intrinsic": 0,
        "use_per": 0,
        "alpha": 1,
        "beta": 1,
        "reward_bias": 1e-1,
        "reward_decay": 0.6,
        "intrinsic_reward_decay":1,
        "kl_min_weight":1e-3,
        "pie_hidden_dim":64,
        "flush":100000000,
        "rsample_rate": 1
    },
    "util_params": {
        "base_log_dir":"outputmetacure"

    }
}
