model:
  # Model to build: a class name plus the positional and keyword arguments
  # listed for it. NOTE(review): presumably resolved to the Hugging Face
  # `transformers` class of the same name and loaded from the "roberta-base"
  # checkpoint — confirm against the code that consumes this file.
  name: 'AutoModelForSequenceClassification'
  args:
    - 'roberta-base'
  kwargs:
    num_labels: 2
    cache_dir: './datas/models/roberta-base'
  # Patterns selecting the trainable parameters. NOTE(review): these look like
  # regular expressions matched against parameter names — verify in the loader.
  # '.*' matches every name; the commented-out alternative below matches only
  # names starting with "classifier.".
  # trainables:
  #   - '^classifier\..*'
  trainables:
    - '.*'

dataset:
  # Tokenizer settings. NOTE(review): `name` matches the checkpoint string
  # listed under `model.args`; presumably the two must stay in sync — confirm.
  tokenizer_args:
    name: 'roberta-base'
    cache_dir: './datas/tokenizers/roberta-base'
    # Active length limit; 512 is kept below as a commented-out alternative.
    max_length: 128
    # max_length: 512
  # Column names listed as inputs. NOTE(review): presumably the dataset fields
  # handed to the model — verify against the data-loading code.
  input_columns:
    - 'input_ids'
    - 'attention_mask'
    - 'labels'