---
# Experiment configuration: a single flat mapping of settings, with keys kept
# in alphabetical order. Two values are sequences (discount_factors and
# robot_config); everything else is a scalar.
# Entries set to null are left unset in this file.
# NOTE(review): presumably the consumer fills in null paths/names at run
# time -- confirm against the code that loads this file.

batch_size: 32
# checkpoint_dir and checkpoints_dir are two distinct keys (singular/plural).
checkpoint_dir: null
checkpoint_freq: 1000
checkpoint_path: null
checkpoints_dir: null
# A sequence, here holding a single value.
discount_factors:
  - 0.85
distance_to_receptacle_map_scale: 0.25
env_name: large_tunnels
# The name embeds "lifting_4", the env_name, and "predicted_with_history",
# which line up with robot_config, env_name, use_predicted_intention and
# use_history_map in this file.
# NOTE(review): looks hand-composed from those keys -- keep in sync if so.
experiment_name: lifting_4-large_tunnels-predicted_with_history
exploration_frac: 0.1
final_exploration: 0.01
grad_norm_clipping: 100
inactivity_cutoff_per_robot: 100
# The intention_* encoding/scale keys are set even though
# use_intention_channels and use_intention_map are both false in this file.
# NOTE(review): presumably ignored while those flags are off -- confirm.
intention_channel_encoding: spatial
intention_channel_nonspatial_scale: 0.025
intention_map_encoding: ramp
learning_rate: 0.01
learning_starts_frac: 0.025
lifting_pointless_drop_penalty: 0.25
# log_dir and logs_dir are two distinct keys (singular/plural).
log_dir: null
logs_dir: null
num_cubes: 20
num_input_channels: 6
obstacle_collision_penalty: 0.25
partial_rewards_scale: 2.0
policy_path: null
random_seed: null
replay_buffer_size: 10000
robot_collision_penalty: 1.0
# A sequence of single-key mappings; here one entry, lifting_robot -> 4.
# NOTE(review): the value is presumably a robot count -- confirm.
robot_config:
  - lifting_robot: 4
room_length: 1.0
room_width: 1.0
run_name: null
shortest_path_map_scale: 0.25
show_gui: false
success_reward: 1.0
target_update_freq: 1000
total_timesteps: 160000
train_freq: 4
use_distance_to_receptacle_map: false
use_double_dqn: true
use_egl_renderer: true
use_history_map: true
use_intention_channels: false
use_intention_map: false
use_partial_observations: true
use_predicted_intention: true
use_predicted_intention_frac: 0.9
use_shortest_path_map: true
use_shortest_path_movement: true
use_shortest_path_partial_rewards: true
use_shortest_path_to_receptacle_map: true
weight_decay: 0.0001
