# Shared defaults. Anchored as `&base` and merged into `gf_base` via
# `<<: *base`, so every experiment that merges `gf_base` receives these keys
# unless it overrides them explicitly.
base: &base
  exp_name: "transformer-border"
  group: "dump"
  task: "expansion"
  batch_size: 16
  # NOTE(review): presumably the batch size used at evaluation time -- confirm
  # against the consumer of this config.
  test_batch_size: 8
  epochs: 8
  seed: 42

# Runtime environment settings. The `&env` anchor is declared here but is not
# aliased anywhere in this file as shown; the section is presumably read
# directly by key -- TODO confirm against the loader.
environments: &env
  gpu_id: 0
  num_workers: 4

# Dataset and optimisation defaults layered on top of `base`. Anchored as
# `&gf_base` and merged into every entry under `experiments`.
# The merge is shallow: keys written explicitly in a mapping take precedence
# over keys pulled in through `<<`.
gf_base: &gf_base
  <<: *base
  field: "GF31"
  training_size: 1000000
  test_size: 5000
  train_test_split: true
  num_variables: 3
  max_degree: 20   # the exponent tokens are prepared up to this number
  # Alternative dataset locations, kept commented out for reference.
  # data_path: "data/expansion/GF31_n=3_deg=4_terms=10_bounds=4_4_4_total=4"
  # data_path: "/software/ais2t/transformer_border_datasets/data/expansion/GF7_n=3_deg=1_terms=10_bounds=4_4_4_total=4"
  # Active dataset. The directory name contains "GF31" and "n=3", which lines
  # up with `field` and `num_variables` above -- keep them in sync when
  # switching datasets (presumed convention; verify against the data loader).
  data_path: "/software/ais2t/transformer_border_datasets/data/expansion/GF31_n=3_deg=1_terms=10_bounds=4_4_4_total=4"
  aware_of_padding: false
  weight_decay: 0.1

# Experiment definitions. Every entry merges `gf_base` (which itself merges
# `base`) and then sets the model/encoding options explicitly.
#
# Two families are defined:
#   * base_k_lt=K     -- differ only in `num_leading_terms` (1, 3, 5, 10, 20)
#                        and the matching tag.
#   * skimming_k_lt=K -- same options, plus `train_sample_skimming: true` and
#                        `training_size` overridden to 100000 (gf_base sets
#                        1000000); defined for K = 1 and 5.
#
# Keys written explicitly in an entry take precedence over merged-in keys.
experiments:
  base_k_lt=1:
    <<: *gf_base
    model: "custom_bart"
    embedding_type: "standard"
    position_encoding_type: "learned"
    coeff_encoding: "prefix"
    learning_target: "k-leading-terms"
    monomial_embedding: true
    num_leading_terms: 1
    tags: ["base", "k_lt=1"]

  base_k_lt=3:
    <<: *gf_base
    model: "custom_bart"
    embedding_type: "standard"
    position_encoding_type: "learned"
    coeff_encoding: "prefix"
    learning_target: "k-leading-terms"
    monomial_embedding: true
    num_leading_terms: 3
    tags: ["base", "k_lt=3"]

  base_k_lt=5:
    <<: *gf_base
    model: "custom_bart"
    embedding_type: "standard"
    position_encoding_type: "learned"
    coeff_encoding: "prefix"
    learning_target: "k-leading-terms"
    monomial_embedding: true
    num_leading_terms: 5
    tags: ["base", "k_lt=5"]

  base_k_lt=10:
    <<: *gf_base
    model: "custom_bart"
    embedding_type: "standard"
    position_encoding_type: "learned"
    coeff_encoding: "prefix"
    learning_target: "k-leading-terms"
    monomial_embedding: true
    num_leading_terms: 10
    tags: ["base", "k_lt=10"]

  base_k_lt=20:
    <<: *gf_base
    model: "custom_bart"
    embedding_type: "standard"
    position_encoding_type: "learned"
    coeff_encoding: "prefix"
    learning_target: "k-leading-terms"
    monomial_embedding: true
    num_leading_terms: 20
    tags: ["base", "k_lt=20"]

  skimming_k_lt=1:
    <<: *gf_base
    training_size: 100000  # overrides the 1000000 inherited from gf_base
    model: "custom_bart"
    embedding_type: "standard"
    position_encoding_type: "learned"
    coeff_encoding: "prefix"
    learning_target: "k-leading-terms"
    monomial_embedding: true
    train_sample_skimming: true
    num_leading_terms: 1
    tags: ["skimming", "k_lt=1"]

  skimming_k_lt=5:
    <<: *gf_base
    training_size: 100000  # overrides the 1000000 inherited from gf_base
    model: "custom_bart"
    embedding_type: "standard"
    position_encoding_type: "learned"
    coeff_encoding: "prefix"
    learning_target: "k-leading-terms"
    monomial_embedding: true
    train_sample_skimming: true
    num_leading_terms: 5
    tags: ["skimming", "k_lt=5"]