data:
    name: "MNIST"

federated:
    algorithm: "FedAvg"
    train_client_size: 200 
    eval_client_size: 200
    noniid_ratio: 0.02                # (C_min/C_max) where C_min, C_max are size of the least/most biggest class
    log_frequency: 20               # log after a number of rounds
    num_clients: 10                  # chosen to be 2^k (compatible to MMT structure)
    num_rounds: 100                  # will be overloaded in continual unlearning
    evaluation_strategy: "fixed"    # whether to use fixed dataset or remaining client's test set

model:
    type: "MLP"
    input_size: 784
    hidden: 30
    out_size: 10

local:
    loss: "CrossEntropyLoss"
    optimizer: "SGD"
    num_epochs: 1
    lr: 0.001       # Lessons: smaller LR seems to have less weird observations
    weight_decay: 0.1
    lr_scheduler: null
    train_batch_size: 20
    eval_batch_size: 64
    grad_clip: 10.0

sequential_unlearning:
    order: [0,2,4]

parallel:
    do_parallel: False 
    do_multi_gpus: True
    num_clients_per_device: 8
    