#!/usr/bin/env bash
# Launch train_PEBBLE.py on env=PointMaze under the experiment name "PEBBLE-cam".
#
# Usage: bash <this-script> SEED ARG2 ARG3 TEACHER_EPS_EQUAL
#   $1  forwarded as seed=<value>
#   $4  forwarded as teacher_eps_equal=<value>
#   $2 and $3 are not read by this script.
#   NOTE(review): presumably positions 2-3 are reserved so the argument layout
#   matches sibling launch scripts -- confirm with the caller.

# Validate before touching the environment: an empty "seed=" or
# "teacher_eps_equal=" override would otherwise be handed to the trainer.
seed=${1:?missing argument 1: value for seed=}
eps_equal=${4:?missing argument 4: value for teacher_eps_equal=}

# Stop if the virtualenv cannot be activated; continuing would run the
# training under whichever python happens to be first on PATH.
source ~/PB2/pebenv/bin/activate || {
  printf 'error: could not activate virtualenv ~/PB2/pebenv\n' >&2
  exit 1
}

# key=value overrides passed verbatim to train_PEBBLE.py, in the original order.
# An array is used so no line-continuation backslashes are needed (a stray
# trailing backslash would swallow whatever line follows the command).
train_args=(
  env=PointMaze
  experiment=PEBBLE-cam

  # Network sizes and learning rates.
  double_q_critic.params.hidden_dim=64
  double_q_critic.params.hidden_depth=2
  diag_gaussian_actor.params.hidden_dim=64
  diag_gaussian_actor.params.hidden_depth=2
  agent.params.actor_lr=0.0005
  agent.params.critic_lr=0.0005
  gradient_update=1
  activation=tanh

  # Step counts / schedule.
  num_unsup_steps=400
  num_train_steps=80000
  num_interact=10000

  # Feedback / reward-model settings.
  max_feedback=20
  reward_batch=4
  reward_update=2000

  # Teacher settings; teacher_eps_equal comes from argument 4.
  teacher_beta=-1
  teacher_gamma=1
  teacher_eps_mistake=0
  teacher_eps_skip=0
  "teacher_eps_equal=${eps_equal}"
  segment=50

  wandb=true
  device=cuda
  "seed=${seed}"
  feed_type=0
)

# Last command: the script's exit status is the trainer's exit status.
python train_PEBBLE.py "${train_args[@]}"