# Flat key = value settings; the key names suggest a model training run
# (NOTE(review): confirm against whatever reads this file).
# Comments are kept on their own lines: many INI-style parsers treat any text
# after the value, including a trailing "# ...", as part of the value.

# Previous value: 0.001
learning_rate = 0.0005
num_epochs = 200
# NOTE(review): the earlier inline note read "Was 512", which equals the
# current value. Confirm whether this setting was actually changed.
adapter_hidden_dim = 512
batch_size = 32
save_best_model = True
# NOTE(review): presumably a periodic save interval; the unit (epochs or
# steps) is not stated in this file. Verify against the consumer.
save_every_X_model = 5
