environment:
  name: tsp  # Other values: cvrp, knapsack
  params:
    #  CVRP Params (other pairs are <150, 55>, <150, 60>)
    num_nodes: 100
    norm_factor: 50

    # Knapsack Params
    num_items: 100
    total_budget: 25

    # TSP Params (other values are 125, 150)
    num_cities: 100

seed: 0

num_steps: 1000                 # Number of training steps
validation_freq: 500            # Every how many steps validation runs

pop_size: 1                     # Population size (e.g. 1, 4, 8, 16, 32)
num_starting_points: 20         # Number of starting points (must lower or equal than the problem size)
training_method: "all"          # What method is used to train the agents (all, best_one_with_tie_breaking, best_one_without_tie_breaking, anneal_parallel_best)
loss_annealing_steps: 0         # For how many steps the annealing from parallel to best works (only if training_method is anneal_parallel_best)
train_encoder: False            # Whether to train the encoder or keep its parameters frozen

num_problems_training: 64           # Batch size (number of problems for each training step)
minibatch_size_training: 64         # Training is run in minibatches (should be a divisor of num_problems_training)
num_problems_validation: 10000      # Number of problems to run validation on (the set is randomly generated and fixed)
minibatch_size_validation: 1000     # Validation is run in minibatches (should be a divisor of num_problems_validation)
use_augmentation_validation: False  # Whether to use augmentations during validation

save_checkpoint: True           # Whether to save checkpoints
save_best: False                # Whether to save a new checkpoint upon achieving best performance (o.w. save the last one)

load_checkpoint: ""             # Path to a checkpoint to be loaded (empty string -> do not load anything)
load_decoder: False             # Whether to load the decoder(s) from the checkpoint
load_optimizer: False           # Whether to load the optimizers from the checkpoint