# Connection settings and credentials for the supported LLM providers.
# The API keys and URLs below are placeholders: substitute real values locally
# and keep real secrets out of version control.
api_settings:
  # OpenAI
  openai_chat_model: 'gpt-4-0125-preview'
  openai_api_key: 'your-openai-api-key'
  base_url: 'your-openai-base-url'  # Optional, can be omitted if not used

  # Azure OpenAI
  use_azure: false  # Set to true if using Azure OpenAI
  azure_base_url: 'https://your-azure-endpoint'
  azure_api_key: 'your-azure-api-key'
  azure_version: '2023-05-15'  # Keep quoted so it is read as a string, not a date
  azure_model: 'gpt-4-0125-preview'

  # Other providers
  claude_api_key: 'your-claude-api-key'
  llama3_api_key: 'your-llama3-api-key'

  
# Parameters for a generation run.
# NOTE(review): the exact meaning and valid range of each key is defined by the
# consuming code, which is not part of this file; confirm there before changing.
generation_settings:
  model_type: 'gpt'
  temperature: 0.8
  generation_number: 10
  batch_size: 5
  few_shot_num: 5
  random_example: false
  max_worker: 2
  label_ratio: null  # Explicitly unset
  label_constraint: false

# Description of the source dataset and where its files live.
generation_hint:
  # Folded scalar (>-): the line breaks below become single spaces and no
  # trailing newline is kept, so the value is one long line of text.
  dataset_description: >-
    It is a large-scale, multi-task language understanding dataset designed to
    evaluate language models' capabilities across various language
    understanding tasks. The dataset questions are presented in a
    multiple-choice format, each with a question (referred to as "text")
    followed by four options (labeled A, B, C, and D). Each question is
    associated with a correct answer ("label")
  dataset_name: 'MMLU'
  # NOTE(review): absolute, machine-specific paths; adjust for your environment.
  original_dataset_path: '/Users/admin/Documents/GitHub/datagen/dataset/MMLU.json'
  save_path: '/Users/admin/Documents/GitHub/datagen/generated_data'
  dataset_constraint: []
  with_label: true
  with_attribute: false
  add_attribute: false
  extra_info_keys: []

# Toggles (plus one iteration count) for optional processing steps.
# NOTE(review): judging by the key names these enable feedback, reflection and
# evaluation stages; confirm the exact behavior against the consuming code.
efficiency_configuration:
  learn_from_mistake: false
  learn_from_human_feedback: false
  feedback_iteration: 1
  self_reflection: true
  math_eval: false
  truthfulness_eval: false