backend: "torch"

data:
    name: "huggingface:papluca/language-identification@llm"
    root: "huggingface_data/"
    splitter: 'meta' # split data according to the 'category' field
    splits: [0.9,0.05,0.05]
    consistent_label_distribution: True

federated:
    algorithm: "FedAvg"
    train_client_size: 200 
    eval_client_size: 100
    log_frequency: 1   # log after a number of rounds
    num_clients: 3
    num_rounds: 1    # will be overloaded in continual unlearning
    evaluation_strategy: "fixed"   # whether to use fixed dataset or remaining client's test set
    random_seed: 123

huggingface:
    token: null 

model:
    type: "huggingface:openai-community/gpt2"
    out_size: 3

llm:
    tok_len: 512
    fine_tune_config: {
                    "lora_config": {
                        "r": 16,
                        "lora_alpha": 32,
                        "lora_dropout": 0.05,
                        "bias": "none",
                        "task_type": "CAUSAL_LM",
                    },
                    "training_args": {"per_device_train_batch_size": 8, "learning_rate": 0.00001, "logging_steps": 1},
                    "bnb_config": {
                        "load_in_4bit": True,
                        "bnb_4bit_use_double_quant": True,
                        "bnb_4bit_quant_type": "nf4",
                        "bnb_4bit_compute_dtype": "bfloat16",
                    },
                }

dataloader:
    type: "base"


local:
    optimizer: "Adam"
    num_epochs: 1
    lr: 0.00005
    weight_decay: 0.01
    lr_scheduler: null
    train_batch_size: 128
    eval_batch_size: 128
    grad_clip: 1.0

sequential_unlearning:
    order: [0, 2]

parallel:
    do_parallel: True       # parallelism happens at sub-fl level
    do_multi_gpus: True 
    num_clients_per_device: 5