variables:
  tokenizer_name: EleutherAI/gpt-neox-20b
  max_seq_len: 1024

seed: 1
precision: amp_fp16
max_seq_len: ${variables.max_seq_len}

models:
-
  model_name: mpt_test
  # Tokenizer
  tokenizer:
    name: ${variables.tokenizer_name}
    kwargs:
      model_max_length: ${variables.max_seq_len}
  model:
    name: mpt_causal_lm
    init_device: mixed
    # Set the below model parameters to match the checkpoint specified with load_path
    d_model: 768
    n_heads: 12
    n_layers: 12
    expansion_ratio: 4
    max_seq_len: ${variables.max_seq_len}
    vocab_size: 50368
    attn_config:
      attn_impl: flash

  load_path:  # Add your non-optional Composer checkpoint path here! (must not be empty)

device_eval_batch_size: 16

# FSDP config for model sharding
fsdp_config:
  sharding_strategy: FULL_SHARD
  mixed_precision: FULL
  forward_prefetch: True
  limit_all_gathers: True

icl_tasks:
-
  label: jeopardy
  dataset_uri: eval/local_data/world_knowledge/jeopardy_all.jsonl  # ADD YOUR OWN DATASET URI
  num_fewshot: [0]
  icl_task_type: language_modeling
  continuation_delimiter: "\nAnswer: "  # this separates questions from answers
  has_categories: true
