{
    "bandit_choice": "SequentialHalving",
    "T": 50,
    "LLM_choice": "WhiteBox_Llama3", 
    "method": "default",
    "few_shot": false,
    "num_examples": 2,
    "reward_method_train": ["rouge", "brevity"],
    "reward_method_eval": ["rouge", "brevity"],
    "use_examples": false, 
    "num_prompts_examples": 5, 
    "num_examples_per_prompt": 2,
    "use_rephrases": true, 
    "num_prompts_rephrases": 10, 
    "task": "xsum",
    "num_eval_samples": 300
}