#!/bin/bash

# The whole script body is wrapped in a brace group: bash reads a compound
# command through to its closing "}" before executing any of it.
# NOTE(review): presumably done so that editing this file while a run is in
# progress cannot affect that run -- confirm with the author.
{

# python experiments/train.py environment.num_cities=1000 \
#     memory.num_nodes=1000 \
#     memory.memory_size=20 \
#     num_steps=5400000 \
#     batch_size=8 \
#     num_starting_positions=20 \
#     budget=200 \
#     optimizer.num_gradient_accumulation_steps=800 \
#     optimizer.encoder.lr=0 optimizer.decoder.lr=0 \
#     loss.weight_offset=0.00001 loss.weight_scale=1 \
#     checkpointing.restore_path="checkpoints/tsp/pomo/bs32_ps1_ga2_seed0" \
#     slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000 \
#     slowrl.memory.memory_size=20 \
#     slowrl.num_starting_points=20 \
#     slowrl.budget=200

# # FOR TRAINING --> note: this configuration was NOT used to produce the current reference checkpoint
# python experiments/train.py environment.num_cities=500 \
#     memory.num_nodes=500 \
#     memory.memory_size=80 \
#     num_steps=5400000 \
#     batch_size=32 \
#     num_starting_positions=30 \
#     budget=200 \
#     optimizer.num_gradient_accumulation_steps=400 \
#     optimizer.encoder.lr=0.00001 optimizer.decoder.lr=0.00001 \
#     optimizer.memory.lr=0.0004 \
#     rollout.policy.temperature=1 \
#     init_mem_mha_scale=1 \
#     loss.sp_spec=false \
#     loss.weight_offset=0.0000001 loss.weight_scale=1 \
#     checkpointing.restore_path="checkpoints/tsp/memo/ms80_puf200_bs32_ps1_ga400_seed0/" \
#     networks.decoder.memory_processing.mlp.num_layers=2 \
#     networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.environment.num_cities=500 \
#     slowrl.memory.num_nodes=500 \
#     slowrl.memory.memory_size=80 \
#     slowrl.num_starting_points=40 \
#     slowrl.budget=200 \
#     slowrl.networks.decoder.memory_processing.mlp.num_layers=2 \
#     slowrl.networks.decoder.memory_processing.mlp.hidden_size=8 \
#     validation.networks.decoder.memory_processing.mlp.num_layers=2 \
#     validation.networks.decoder.memory_processing.mlp.hidden_size=8 \
#     networks.encoder.query_chunk_size=250 \
#     networks.decoder.query_chunk_size=500 \
#     networks.decoder.key_chunk_size=500 \
#     validation.networks.encoder.query_chunk_size=250 \
#     validation.networks.decoder.query_chunk_size=500 \
#     validation.networks.decoder.key_chunk_size=500 \
#     slowrl.networks.encoder.query_chunk_size=250 \
#     slowrl.networks.decoder.query_chunk_size=500 \
#     slowrl.networks.decoder.key_chunk_size=500 \
#     logger.neptune.name="test loss" \

#     ## checkpointing.restore_path="checkpoints/tsp/pomo/bs64_ps1_ga1_seed0" \

# # NOW EXPERIMENTING A BIT WITH SLOWRL RUNS
# python experiments/slowrl_validate.py \
#     slowrl.environment.num_cities=500 \
#     slowrl.memory.num_nodes=500 \
#     slowrl.num_starting_points=100 \
#     slowrl.instances_batch_size=8 \
#     slowrl.problems.load_problem=false \
#     slowrl.problems.num_problems=64 \
#     slowrl.memory.memory_size=100 \
#     slowrl.budget=400 \
#     slowrl.networks.decoder.memory_processing.mlp.num_layers=2 \
#     slowrl.networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms80_puf200_bs32_ps1_ga400_seed0/" \
#     slowrl.rollout.policy.temperature=0.8 \
#     slowrl.networks.encoder.query_chunk_size=250 \
#     slowrl.networks.decoder.query_chunk_size=500 \
#     slowrl.networks.decoder.key_chunk_size=500 \


# Check the logits in slowrl on a small setup (100 cities, 8 generated problems).
#
# The key=value overrides are collected in an array so that every override sits
# on its own line without backslash continuations. The previous form ended its
# last argument with a dangling "\", which only worked because the next line
# happened to be blank: any non-blank line placed directly after it would have
# been spliced into this command.
slowrl_overrides=(
    # Problem setup: instance size, number of instances, batching.
    slowrl.environment.num_cities=100
    slowrl.memory.num_nodes=100
    slowrl.num_starting_points=20
    slowrl.instances_batch_size=1
    slowrl.problems.load_problem=false
    slowrl.problems.num_problems=8

    # Memory size and budget.
    slowrl.memory.memory_size=40
    slowrl.budget=40

    # Memory-processing MLP of the decoder.
    # NOTE(review): presumably has to match the architecture stored in the
    # restored checkpoint -- confirm.
    slowrl.networks.decoder.memory_processing.mlp.num_layers=2
    slowrl.networks.decoder.memory_processing.mlp.hidden_size=8

    # Checkpoint to restore and rollout policy temperature.
    slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms40_puf200_bs64_ps1_ga200_seed0/"
    slowrl.rollout.policy.temperature=1

    # Query/key chunk sizes for the encoder and decoder networks.
    slowrl.networks.encoder.query_chunk_size=250
    slowrl.networks.decoder.query_chunk_size=500
    slowrl.networks.decoder.key_chunk_size=500
)

# Quoted "${array[@]}" passes each override as exactly one argument, in order.
python experiments/slowrl_validate.py "${slowrl_overrides[@]}"

# python experiments/slowrl_validate.py \
#     slowrl.environment.num_cities=500 \
#     slowrl.memory.num_nodes=500 \
#     slowrl.num_starting_points=100 \
#     slowrl.instances_batch_size=8 \
#     slowrl.problems.load_problem=false \
#     slowrl.problems.num_problems=64 \
#     slowrl.memory.memory_size=80 \
#     slowrl.budget=400 \
#     slowrl.networks.decoder.memory_processing.mlp.num_layers=2 \
#     slowrl.networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms80_puf200_bs32_ps1_ga400_seed0/" \
#     slowrl.rollout.policy.temperature=1 \
#     slowrl.networks.encoder.query_chunk_size=250 \
#     slowrl.networks.decoder.query_chunk_size=500 \
#     slowrl.networks.decoder.key_chunk_size=500 \

# python experiments/slowrl_validate.py \
#     slowrl.environment.num_cities=500 \
#     slowrl.memory.num_nodes=500 \
#     slowrl.num_starting_points=100 \
#     slowrl.instances_batch_size=8 \
#     slowrl.problems.load_problem=false \
#     slowrl.problems.num_problems=64 \
#     slowrl.memory.memory_size=40 \
#     slowrl.budget=200 \
#     slowrl.networks.decoder.memory_processing.mlp.num_layers=2 \
#     slowrl.networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms40_puf200_bs32_ps1_ga400_seed0/" \
#     slowrl.rollout.policy.temperature=1 \
#     slowrl.networks.encoder.query_chunk_size=250 \
#     slowrl.networks.decoder.query_chunk_size=500 \
#     slowrl.networks.decoder.key_chunk_size=500 \

# python experiments/slowrl_validate.py \
#     slowrl.environment.num_cities=500 \
#     slowrl.memory.num_nodes=500 \
#     slowrl.num_starting_points=100 \
#     slowrl.instances_batch_size=8 \
#     slowrl.problems.load_problem=false \
#     slowrl.problems.num_problems=64 \
#     slowrl.memory.memory_size=40 \
#     slowrl.budget=100 \
#     slowrl.networks.decoder.memory_processing.mlp.num_layers=2 \
#     slowrl.networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms40_puf200_bs32_ps1_ga400_seed0/" \
#     slowrl.rollout.policy.temperature=1 \
#     slowrl.networks.encoder.query_chunk_size=250 \
#     slowrl.networks.decoder.query_chunk_size=500 \
#     slowrl.networks.decoder.key_chunk_size=500 \

# python experiments/slowrl_validate.py \
#     slowrl.environment.num_cities=500 \
#     slowrl.memory.num_nodes=500 \
#     slowrl.num_starting_points=100 \
#     slowrl.instances_batch_size=8 \
#     slowrl.problems.load_problem=false \
#     slowrl.problems.num_problems=64 \
#     slowrl.memory.memory_size=40 \
#     slowrl.budget=400 \
#     slowrl.networks.decoder.memory_processing.mlp.num_layers=2 \
#     slowrl.networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms40_puf200_bs32_ps1_ga400_seed0/" \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.networks.encoder.query_chunk_size=250 \
#     slowrl.networks.decoder.query_chunk_size=500 \
#     slowrl.networks.decoder.key_chunk_size=500 \

# python experiments/slowrl_validate.py \
#     slowrl.environment.num_cities=500 \
#     slowrl.memory.num_nodes=500 \
#     slowrl.num_starting_points=100 \
#     slowrl.instances_batch_size=8 \
#     slowrl.problems.load_problem=false \
#     slowrl.problems.num_problems=64 \
#     slowrl.memory.memory_size=80 \
#     slowrl.budget=400 \
#     slowrl.networks.decoder.memory_processing.mlp.num_layers=2 \
#     slowrl.networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms40_puf200_bs32_ps1_ga400_seed0/" \
#     slowrl.rollout.policy.temperature=1 \
#     slowrl.networks.encoder.query_chunk_size=250 \
#     slowrl.networks.decoder.query_chunk_size=500 \
#     slowrl.networks.decoder.key_chunk_size=500 \



# FOR SLOWRL
# python experiments/slowrl_validate.py eas.environment.num_cities=1000 \
#     eas.num_starting_points=100 \
#     eas.budget=400 \
#     eas.batch_size=8 eas.problems.num_problems=64 \
#     eas.policy.temperature=1.0 \
#     eas.checkpointing.restore_path="checkpoints/tsp/pomo/bs32_ps1_ga2_seed0" \
    


# python experiments/slowrl_validate.py \
#     slowrl.environment.num_cities=1000 \
#     slowrl.num_starting_points=100 \
#     slowrl.instances_batch_size=8 \
#     slowrl.problems.num_problems=64 \
#     slowrl.memory.num_nodes=1000 \
#     slowrl.memory.memory_size=20 \
#     slowrl.budget=400 \
#     slowrl.networks.decoder.memory_processing.mlp.num_layers=4 \
#     slowrl.networks.decoder.memory_processing.mlp.hidden_size=64 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms20_puf200_bs8_ps1_ga800_seed0/" \
#     slowrl.rollout.policy.temperature=0.1 \


# python experiments/train.py environment.num_cities=100 \
#     memory.num_nodes=100 \
#     memory.memory_size=40 \
#     num_steps=4500000 \
#     batch_size=64 \
#     num_starting_positions=40 \
#     budget=200 \
#     optimizer.num_gradient_accumulation_steps=200 \
#     loss.weight_offset=0.0000001 loss.weight_scale=1 \
#     checkpointing.restore_path="data/v1_models/tsp/pomo/" \
#     networks.decoder.memory_processing.mlp.num_layers=2 \
#     networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.environment.num_cities=100 \
#     slowrl.memory.num_nodes=100 \
#     slowrl.memory.memory_size=40 \
#     slowrl.num_starting_points=40 \
#     slowrl.budget=200 \
#     slowrl.networks.decoder.memory_processing.mlp.num_layers=2 \
#     slowrl.networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.problems.load_problem=true \
#     slowrl.problems.load_path="data/validation/tsp100_test_small_seed1235.pkl" \
#     slowrl.instances_batch_size=64 \
#     validation.networks.decoder.memory_processing.mlp.num_layers=2 \
#     validation.networks.decoder.memory_processing.mlp.hidden_size=8 \


# python experiments/train.py environment.num_cities=100 \
#     memory.num_nodes=100 \
#     memory.memory_size=40 \
#     num_steps=4500000 \
#     batch_size=64 \
#     num_starting_positions=40 \
#     budget=400 \
#     optimizer.num_gradient_accumulation_steps=400 \
#     loss.weight_offset=0.0000001 loss.weight_scale=1 \
#     checkpointing.restore_path="data/v1_models/tsp/pomo/" \
#     networks.decoder.memory_processing.mlp.num_layers=2 \
#     networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.environment.num_cities=100 \
#     slowrl.memory.num_nodes=100 \
#     slowrl.memory.memory_size=40 \
#     slowrl.num_starting_points=40 \
#     slowrl.budget=400 \
#     slowrl.networks.decoder.memory_processing.mlp.num_layers=2 \
#     slowrl.networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.problems.load_problem=true \
#     slowrl.problems.load_path="data/validation/tsp100_test_small_seed1235.pkl" \
#     slowrl.instances_batch_size=64 \
#     validation.networks.decoder.memory_processing.mlp.num_layers=2 \
#     validation.networks.decoder.memory_processing.mlp.hidden_size=8 \

# python experiments/train.py environment.num_cities=100 \
#     memory.num_nodes=100 \
#     memory.memory_size=40 \
#     num_steps=4500000 \
#     batch_size=64 \
#     num_starting_positions=40 \
#     budget=800 \
#     optimizer.num_gradient_accumulation_steps=800 \
#     loss.weight_offset=0.0000001 loss.weight_scale=1 \
#     checkpointing.restore_path="data/v1_models/tsp/pomo/" \
#     networks.decoder.memory_processing.mlp.num_layers=2 \
#     networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.environment.num_cities=100 \
#     slowrl.memory.num_nodes=100 \
#     slowrl.memory.memory_size=40 \
#     slowrl.num_starting_points=40 \
#     slowrl.budget=400 \
#     slowrl.networks.decoder.memory_processing.mlp.num_layers=2 \
#     slowrl.networks.decoder.memory_processing.mlp.hidden_size=8 \
#     slowrl.problems.load_problem=true \
#     slowrl.problems.load_path="data/validation/tsp100_test_small_seed1235.pkl" \
#     slowrl.instances_batch_size=64 \
#     validation.networks.decoder.memory_processing.mlp.num_layers=2 \
#     validation.networks.decoder.memory_processing.mlp.hidden_size=8 \


# python experiments/train.py environment.num_cities=1000 \
#     memory.num_nodes=1000 \
#     memory.memory_size=80 \
#     num_steps=4800000 \
#     batch_size=8 \
#     num_starting_positions=5 \
#     optimizer.num_gradient_accumulation_steps=800 \
#     loss.weight_offset=1 loss.weight_scale=1 \
#     checkpointing.restore_path="checkpoints/tsp/pomo/bs16_ps1_ga2_seed0" \
#     slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000 \
#     slowrl.memory.memory_size=80

# python experiments/slowrl_validate.py slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000 \
#     slowrl.num_starting_points=5 \
#     slowrl.budget=200 \
#     slowrl.pop_size=1 \
#     slowrl.batch_size=8 slowrl.problems.num_problems=64 \
#     slowrl.rollout.policy.temperature=1 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms40_puf200_bs8_ps1_ga800_seed0"

# python experiments/slowrl_validate.py slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000 \
#     slowrl.num_starting_points=5 \
#     slowrl.budget=200 \
#     slowrl.pop_size=1 \
#     slowrl.batch_size=8 slowrl.problems.num_problems=64 \
#     slowrl.rollout.policy.temperature=0.3 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms40_puf200_bs8_ps1_ga800_seed0"



# python experiments/slowrl_validate.py slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000 \
#     slowrl.num_starting_points=20 \
#     slowrl.budget=3000 \
#     slowrl.pop_size=1 \
#     slowrl.batch_size=8 slowrl.problems.num_problems=64 \
#     slowrl.rollout.policy.temperature=0.5 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms40_puf200_bs8_ps1_ga800_seed0"

# python experiments/slowrl_validate.py slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000 \
#     slowrl.num_starting_points=20 \
#     slowrl.budget=3000 \
#     slowrl.pop_size=1 \
#     slowrl.batch_size=8 slowrl.problems.num_problems=64 \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms40_puf200_bs8_ps1_ga800_seed0"

# python experiments/slowrl_validate.py slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000 \
#     slowrl.num_starting_points=20 \
#     slowrl.budget=3000 \
#     slowrl.pop_size=1 \
#     slowrl.batch_size=8 slowrl.problems.num_problems=64 \
#     slowrl.rollout.policy.temperature=1 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms40_puf200_bs8_ps1_ga800_seed0"

# python experiments/slowrl_validate.py slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000 \
#     slowrl.num_starting_points=20 \
#     slowrl.budget=3000 \
#     slowrl.pop_size=1 \
#     slowrl.batch_size=8 slowrl.problems.num_problems=64 \
#     slowrl.rollout.policy.temperature=0.05 \
#     slowrl.checkpointing.restore_path="checkpoints/tsp/memo/ms40_puf200_bs8_ps1_ga800_seed0"



# python experiments/train.py environment.num_cities=1000 \
#     memory.num_nodes=1000 \
#     num_steps=4800000 \
#     batch_size=8 \
#     num_starting_positions=5 \
#     optimizer.num_gradient_accumulation_steps=800 \
#     loss.weight_offset=2 loss.weight_scale=5 \
#     checkpointing.restore_path="checkpoints/tsp/pomo/bs16_ps1_ga2_seed0" \
#     slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000

# python experiments/train.py environment.num_cities=1000 \
#     memory.num_nodes=1000 \
#     num_steps=4800000 \
#     batch_size=8 \
#     num_starting_positions=5 \
#     optimizer.num_gradient_accumulation_steps=800 \
#     loss.weight_offset=5 loss.weight_scale=5 \
#     checkpointing.restore_path="checkpoints/tsp/pomo/bs16_ps1_ga2_seed0" \
#     slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000

# python experiments/train.py environment.num_cities=1000 \
#     memory.num_nodes=1000 \
#     num_steps=4800000 \
#     batch_size=8 \
#     num_starting_positions=5 \
#     optimizer.num_gradient_accumulation_steps=800 \
#     loss.weight_offset=5 loss.weight_scale=5 \
#     loss.sp_spec=true \
#     checkpointing.restore_path="checkpoints/tsp/pomo/bs16_ps1_ga2_seed0" \
#     slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000

# python experiments/slowrl_validate.py slowrl.environment.num_cities=1000

# python experiments/slowrl_validate.py slowrl.environment.num_cities=1000 \
#     slowrl.memory.num_nodes=1000 \
#     slowrl.num_starting_points=10 \
#     slowrl.pop_size=1 \
#     slowrl.batch_size=1 slowrl.problems.num_problems=8 \
#     slowrl.rollout.policy.temperature=0.1
#     # slowrl.rollout.policy.temperature=0.001

# python experiments/slowrl_validate.py slowrl.environment.num_cities=1000 \
#     slowrl.num_starting_points=100 \
#     slowrl.pop_batch=16 \
#     slowrl.batch_size=1 slowrl.problems.num_problems=64 \
#     slowrl.rollout.policy.temperature=0.001


# python experiments/slowrl_validate.py slowrl.num_starting_points=20 slowrl.batch_size=2 slowrl.problems.num_problems=512

# python experiments/slowrl_validate.py slowrl.memory.memory_size=20
    # slowrl.environment.num_cities=200 slowrl.memory.num_nodes=200 \
# python experiments/slowrl_validate.py slowrl.num_starting_points=10 slowrl.problems.num_problems=256


# # budget 200
# python experiments/slowrl_validate.py slowrl.environment.num_cities=100 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=100 \
#     slowrl.budget=200

# python experiments/slowrl_validate.py slowrl.environment.num_cities=150 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=150 \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.budget=200

# python experiments/slowrl_validate.py slowrl.environment.num_cities=200 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=200 \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.budget=200


# # budget 400
# python experiments/slowrl_validate.py slowrl.environment.num_cities=100 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=100 \
#     slowrl.budget=400

# python experiments/slowrl_validate.py slowrl.environment.num_cities=150 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=150 \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.budget=400

# python experiments/slowrl_validate.py slowrl.environment.num_cities=200 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=200 \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.budget=400


# # budget 600
# python experiments/slowrl_validate.py slowrl.environment.num_cities=100 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=100 \
#     slowrl.budget=600

# python experiments/slowrl_validate.py slowrl.environment.num_cities=150 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=150 \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.budget=600

# python experiments/slowrl_validate.py slowrl.environment.num_cities=200 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=200 \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.budget=600


# # budget 800
# python experiments/slowrl_validate.py slowrl.environment.num_cities=100 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=100 \
#     slowrl.budget=800

# python experiments/slowrl_validate.py slowrl.environment.num_cities=150 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=150 \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.budget=800

# python experiments/slowrl_validate.py slowrl.environment.num_cities=200 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=200 \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.budget=800


# # budget 1600
# python experiments/slowrl_validate.py slowrl.environment.num_cities=100 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=100 \
#     slowrl.budget=1600

# python experiments/slowrl_validate.py slowrl.environment.num_cities=150 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=150 \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.budget=1600

# python experiments/slowrl_validate.py slowrl.environment.num_cities=200 \
#     slowrl.problems.load_problem=false slowrl.problems.num_problems=512 \
#     slowrl.memory.num_nodes=200 \
#     slowrl.rollout.policy.temperature=0.1 \
#     slowrl.budget=1600

}

