---
# Sweep definition header: where runs are logged, which program is launched,
# how it is launched, and which metric the search optimises.
project: ETHER
entity: near3213
program: benchmark_wandb_ether.py

# Launch command template. The ${...} placeholders are presumably expanded
# by the sweep agent at launch time (environment, program name, arguments).
command:
        - ${env}
        # NOTE(review): absolute, machine-specific interpreter path; agents
        # started on another host will need this entry adjusted.
        - /media/kevin/b8ccc6cc-ccc1-469c-aab1-807bad8adb84/DATA/UNI/ETHER-afterSony/ether-sony-env/bin/python
        - ${program}
        - ${args}

# Bayesian search, maximising the metric named below.
method: bayes
metric:
        name: 'PerEpoch/test/repetition0/comm_round0/sem_grounding_metric_0/s0/Accuracy-any-shape/Mean'
        goal: maximize
# Search space. An entry with a single candidate value is effectively a
# constant; an entry with several candidates is searched over.
parameters:
        # --- Run setup -----------------------------------------------------
        # Three seeds are searched over.
        seed:
                values: [10, 20, 30]

        success_threshold:
                values: [0.5]

        # Two candidate experiment configuration files.
        config:
                values:
                        - 'room12x5Objs_miniworld_wandb_benchmark_ETHER+R2D2+RP+SharedObsEncoder_config.yaml'
                        - 'room12x5Objs_miniworld_wandb_benchmark_ETHER+R2D2+RP+BN+SharedObsEncoder_config.yaml'

        language_guided_curiosity:
                values: [false]

        coverage_metric:
                values: [true]

        MiniWorld_entity_visibility_oracle:
                values: [false]

        MiniWorld_entity_visibility_oracle_top_view:
                values: [false]

        # --- Module switches -----------------------------------------------
        use_ETHER:
                values: [true]
        use_THER:
                values: [true]

        # NOTE(review): use_RP is false while RP_use_RP is true — confirm
        # which of the two flags the program actually reads.
        use_RP:
                values: [false]
        RP_use_RP:
                values: [true]

        # NOTE(review): same pattern here — use_ELA is false, ELA_use_ELA
        # is true; confirm the intended combination.
        use_ELA:
                values: [false]
        ELA_use_ELA:
                values: [true]

        use_HER:
                values: [false]
        goal_oriented:
                values: [false]

        # --- ETHER / THER toggles ------------------------------------------
        ETHER_use_ETHER:
                values: [true]

        THER_use_THER:
                values: [true]

        THER_use_THER_predictor_supervised_training:
                values: [false]

        THER_use_THER_predictor_supervised_training_data_collection:
                values: [true]

        ETHER_use_supervised_training:
                values: [false]

        # --- ETHER_rg_* architecture and loss options ----------------------
        ETHER_rg_sanity_check_compactness_ambiguity_metric:
                values: [false]

        # Searched: both settings are candidates.
        ETHER_rg_shared_architecture:
                values: [false, true]

        ETHER_rg_with_logits_mdl_principle:
                values: [true]

        # Searched: two factors.
        ETHER_rg_logits_mdl_principle_factor:
                values: [1.0e-3, 1.0e-4]

        # Searched: four thresholds.
        ETHER_rg_logits_mdl_principle_accuracy_threshold:
                values: [10.0, 20.0, 40.0, 60.0]

        # Searched: two loss types.
        ETHER_rg_agent_loss_type:
                values: ['Impatient+Hinge', 'Hinge']

        # Searched: both settings are candidates.
        ETHER_use_continuous_feedback:
                values: [false, true]

        ETHER_listener_based_predicated_reward_fn:
                values: [true]

        ETHER_rg_with_semantic_grounding_metric:
                values: [true]
        MiniWorld_symbolic_image:
                values: [true]

        # --- ETHER_rg_* semantic grounding and augmentation ----------------
        ETHER_rg_homoscedastic_multitasks_loss:
                values: [false]

        ETHER_rg_use_semantic_cooccurrence_grounding:
                values: [true]

        # Searched: four lambdas (10, 100, 1000, 10000).
        # The exponent carries an explicit sign on purpose: YAML 1.1 loaders
        # such as PyYAML only resolve scientific notation as a float when
        # the mantissa has a dot AND the exponent is signed; `1.0e1` would
        # otherwise be loaded as the string "1.0e1".
        ETHER_rg_semantic_cooccurrence_grounding_lambda:
                values: [1.0e+1, 1.0e+2, 1.0e+3, 1.0e+4]

        # Searched: four noise magnitudes.
        ETHER_rg_semantic_cooccurrence_grounding_noise_magnitude:
                values: [0.2, 0.1, 0.01, 0.4]

        ETHER_lock_test_storage:
                values: [true]
        ETHER_rg_filter_out_non_unique:
                values: [false]

        ETHER_rg_color_jitter_prob:
                values: [0.0]
        # Searched: six probabilities.
        ETHER_rg_gaussian_blur_prob:
                values: [0.0, 0.1, 0.25, 0.5, 0.75, 0.9]

        # Searched: six probabilities.
        ETHER_rg_egocentric_prob:
                values: [0.0, 0.1, 0.25, 0.5, 0.75, 0.9]

        ETHER_rg_object_centric_version:
                values: [2]
        ETHER_rg_descriptive_version:
                values: [1]

        # --- ETHER_rg_* optimisation ---------------------------------------
        ETHER_rg_learning_rate:
                values: [6.25e-5]
        ETHER_rg_weight_decay:
                values: [0.0]

        ETHER_rg_l2_weight_decay:
                values: [0.0]
        # Searched: four L1 coefficients (including 0.0).
        ETHER_rg_l1_weight_decay:
                values: [0.0, 0.00001, 0.001, 0.0001]

        ETHER_rg_vocab_size:
                values: [64]
        # Searched: two training periods.
        ETHER_rg_training_period:
                values: [8192, 16384]

        # --- ETHER_rg_* task variants --------------------------------------
        ETHER_rg_object_centric:
                values: [false]
        # Searched: both settings are candidates.
        ETHER_rg_descriptive:
                values: [false, true]
        ETHER_rg_use_curriculum_nbr_distractors:
                values: [false]

        # Searched: four epoch counts.
        ETHER_rg_nbr_epoch_per_update:
                values: [8, 16, 32, 64]
        # Searched: three thresholds.
        ETHER_rg_accuracy_threshold:
                values: [70, 90, 95]

        # Searched: three training distractor counts; the test count is fixed.
        ETHER_rg_nbr_train_distractors:
                values: [31, 7, 15]
        ETHER_rg_nbr_test_distractors:
                values: [7]

        # --- ETHER storage -------------------------------------------------
        ETHER_replay_capacity:
                values: [8192]
        ETHER_test_replay_capacity:
                values: [1024]

        # Searched: two sampling schemes.
        ETHER_rg_distractor_sampling:
                values: ['uniform', 'similarity-90']

        # --- RP_* settings (every entry has a single candidate value) ------
        RP_use_PER:
                values: [true]

        RP_lock_test_storage:
                values: [false]

        # Predictor optimisation.
        RP_predictor_learning_rate:
                values: [6.25e-5]

        RP_gradient_clip:
                values: [5.0]

        # Training storage.
        RP_replay_capacity:
                values: [16384]
        RP_min_capacity:
                values: [32]

        RP_predictor_nbr_minibatches:
                values: [4]
        RP_predictor_batch_size:
                values: [256]

        # Test storage.
        RP_predictor_test_train_split_interval:
                values: [3]
        RP_test_replay_capacity:
                values: [1024]

        RP_test_min_capacity:
                values: [32]
        RP_replay_period:
                values: [1024]

        RP_nbr_training_iteration_per_update:
                values: [8]

        RP_predictor_accuracy_threshold:
                values: [90]

        # --- ELA_* settings (every entry has a single candidate value) -----
        # Architecture and loss options.
        ELA_rg_sanity_check_compactness_ambiguity_metric:
                values: [false]

        ELA_rg_shared_architecture:
                values: [false]

        ELA_rg_with_logits_mdl_principle:
                values: [true]

        ELA_rg_logits_mdl_principle_factor:
                values: [1.0e-3]

        ELA_rg_logits_mdl_principle_accuracy_threshold:
                values: [10.0]

        ELA_rg_agent_loss_type:
                values: ['Impatient+Hinge']

        # Semantic co-occurrence grounding.
        ELA_rg_use_semantic_cooccurrence_grounding:
                values: [false]

        ELA_rg_semantic_cooccurrence_grounding_lambda:
                values: [1.0]

        ELA_rg_semantic_cooccurrence_grounding_noise_magnitude:
                values: [0.2]

        ELA_lock_test_storage:
                values: [true]

        # Augmentation switches.
        ELA_rg_with_color_jitter_augmentation:
                values: [false]

        ELA_rg_with_gaussian_blur_augmentation:
                values: [true]

        ELA_rg_egocentric:
                values: [false]

        ELA_rg_object_centric_version:
                values: [2]
        ELA_rg_descriptive_version:
                values: [1]

        # Optimisation.
        ELA_rg_learning_rate:
                values: [6.25e-5]
        ELA_rg_weight_decay:
                values: [0.0]

        ELA_rg_vocab_size:
                values: [64]
        ELA_rg_training_period:
                values: [4096]

        ELA_rg_descriptive:
                values: [false]
        ELA_rg_use_curriculum_nbr_distractors:
                values: [false]

        ELA_rg_nbr_epoch_per_update:
                values: [2]
        ELA_rg_accuracy_threshold:
                values: [90]

        ELA_rg_nbr_train_distractors:
                values: [7]
        ELA_rg_nbr_test_distractors:
                values: [7]

        # Storage.
        ELA_replay_capacity:
                values: [8192]
        ELA_test_replay_capacity:
                values: [2048]

        ELA_rg_distractor_sampling:
                values: ['uniform']

        # Reward weights and feedback rewards.
        ELA_reward_extrinsic_weight:
                values: [0.0]
        ELA_reward_intrinsic_weight:
                values: [1.0]

        ELA_feedbacks_failure_reward:
                values: [-0.1]
        ELA_feedbacks_success_reward:
                values: [1]

        # --- THER_* settings -----------------------------------------------
        # Only THER_filter_out_timed_out_episode has more than one candidate.
        THER_use_PER:
                values: [true]
        THER_observe_achieved_goal:
                values: [false]

        THER_lock_test_storage:
                values: [true]

        # Feedback rewards.
        THER_feedbacks_failure_reward:
                values: [-1]
        THER_feedbacks_success_reward:
                values: [1]

        THER_episode_length_reward_shaping:
                values: [true]

        # Training storage.
        THER_replay_capacity:
                values: [1024]
        THER_min_capacity:
                values: [12]

        THER_predictor_nbr_minibatches:
                values: [1]
        THER_predictor_batch_size:
                values: [32]

        # Test storage.
        THER_predictor_test_train_split_interval:
                values: [5]
        THER_test_replay_capacity:
                values: [256]

        THER_test_min_capacity:
                values: [4]
        THER_replay_period:
                values: [4096]

        THER_train_on_success:
                values: [false]
        THER_nbr_training_iteration_per_update:
                values: [128]

        THER_predict_PADs:
                values: [false]
        # NOTE(review): expressed as a fraction (0.95) whereas
        # RP_predictor_accuracy_threshold in this file is 90 — confirm the
        # two thresholds are meant to use different scales.
        THER_predictor_accuracy_threshold:
                values: [0.95]

        THER_predictor_accuracy_safe_to_relabel_threshold:
                values: [0.0]
        THER_filter_predicate_fn:
                values: [false]

        THER_relabel_terminal:
                values: [false]
        # Searched: both settings are candidates.
        THER_filter_out_timed_out_episode:
                values: [false, true]

        THER_train_contrastively:
                values: [false]
        THER_contrastive_training_nbr_neg_examples:
                values: [0]

        THER_timing_out_episode_length_threshold:
                values: [40]

        # --- Core agent / training settings (single candidate value each) --
        BabyAI_Bot_action_override:
                values: [false]

        n_step:
                values: [3]
        nbr_actor:
                values: [32]
        eps_greedy_alpha:
                values: [2.0]

        nbr_minibatches:
                values: [1]
        batch_size:
                values: [64]

        # Scientific notation below is written with a dotted mantissa and a
        # signed exponent on purpose: YAML 1.1 loaders such as PyYAML load
        # `4e3` / `5e3` as the strings "4e3" / "5e3" rather than as floats.
        min_capacity:
                values: [4.0e+3]
        replay_capacity:
                values: [5.0e+3]
        learning_rate:
                values: [6.25e-5]

        # Sequence replay.
        sequence_replay_burn_in_ratio:
                values: [0.5]
        weights_entropy_lambda:
                values: [0.0]

        sequence_replay_unroll_length:
                values: [20]
        sequence_replay_overlap_length:
                values: [10]

        sequence_replay_use_online_states:
                values: [true]
        sequence_replay_use_zero_initial_states:
                values: [false]

        sequence_replay_store_on_terminal:
                values: [false]
        HER_target_clamping:
                values: [false]

        adam_weight_decay:
                values: [0.0]
        ther_adam_weight_decay:
                values: [0.0]

        nbr_training_iteration_per_cycle:
                values: [128]
        nbr_episode_per_cycle:
                values: [16]

        single_pick_episode:
                values: [true]

        # Same value as THER_timing_out_episode_length_threshold in this file.
        time_limit:
                values: [40]

        # Signed exponent for the same reason as min_capacity above:
        # `5.0e4` would be loaded as a string by YAML 1.1 loaders.
        train_observation_budget:
                values: [5.0e+4]

 
