# Data configuration: names the train/validation datasets, the tokenizer,
# a cache directory, and two boolean switches.
# NOTE(review): the code that consumes these keys is not visible from this
# file; semantics marked "presumably" below should be confirmed against it.

# Dataset identifiers; training and validation both point at the same name.
train: lm1b
valid: lm1b

# Tokenizer identifier; per the key name this may be either a registered
# tokenizer name or a filesystem path (here: a name).
tokenizer_name_or_path: gpt2

# Relative path; presumably resolved against the process working
# directory -- TODO confirm.
cache_dir: data

# Boolean switches, written in canonical lowercase so every YAML loader
# (1.1 and 1.2, any schema) resolves them to real booleans.
# `wrap`: presumably controls how text is wrapped/packed into fixed-length
# sequences -- TODO confirm against the data loader.
wrap: true
# `streaming`: presumably toggles streamed (non-materialized) dataset
# loading -- TODO confirm against the data loader.
streaming: false
