{
    "n_layers": 6,
    "model_dim": 256,
    "dropout": 0.25,
    "vocab_size": 33,
    "sequence_length": 82,
    "learning_rate": 0.005,
    "n_max_epochs": 1000,
    "batch_size": 8192,
    "device": "cuda"
}