{
    "do_train":true,
    "do_eval":true,
    "overwrite_output_dir":true,
    "load_best_model_at_end":true,
    "model_name_or_path":"gpt2",
    "dataset_name":"wikitext",
    "dataset_config_name":"wikitext-2-raw-v1",
    "per_device_train_batch_size":4,
    "per_device_eval_batch_size":8,
    "num_train_epochs":10,
    "dataloader_num_workers":16,
    "evaluation_strategy":"epoch",
    "save_strategy":"epoch",
    "k":7,
    "n_experts":[1, 2, 3, 4, 5, 6],
    "n_cluster":3,
    "seed":42,
    "use_moe":"CAMex",
    "moe_level":"token",
    "learning_rate":1e-5,
    "output_dir":"./checkpoints/test"
}
