
{
    "model" : "VIT",
    "data" : "cifar10",
    "batch_size_train": 100,
    "batch_size_test": 100,
    "act_func": "ReLU",
    "Vw": 1.3,
    "Vb": 0.0,
    "lr": 1e-5,
    "patch_size": 4,
    "hidden_size" : 300,
    "num_hidden_layers": 20,
    "num_attention_heads": 1,
    "intermediate_size": 300, 
    "qkv_bias": false,
    "residual" : false,
    "output_attentions": false,
    "use_faster_attention" : true,
    "seed": 42,
    "max_steps": 10000,
    "max_epochs": 4,
    "accelerator" : "gpu",
    "init" : "Gaussian"
}


