# This config is used together with `data2hf` to convert the synthesized
# data to the Hugging Face format.

# Dataset settings are pulled in from `base_data_setting.yml` through the
# custom `!include` tag, so the loader must register a constructor for it.
data:
  !include base_data_setting.yml
  
# Location of the dotenv file.
# NOTE(review): presumably holds the API keys for the model provider — confirm.
environment:
  dotenv_path: .env
  
# Language-model settings for the three step configs defined below.
model:

  # Model names listed as options for `model_name`:
  # GPTs:
  # - gpt-3.5-turbo, gpt-4, gpt-4o
  # - gpt-4-1106-preview, gpt-4-0125-preview
  # DeepSeek:
  # - deepseek/deepseek-chat
  # Qwen:
  # - qwen2.5-72b-instruct
  # - Qwen2.5-Max
  # Both values are anchored so every step config below aliases the same
  # model; change them here only.
  model_name: &model_name deepseek/deepseek-chat
  model_type: &model_type deepseekAPI

  decompose_step_config:
    model_name: *model_name
    model_type: *model_type
    # Anchored here; the other two step configs alias this exact mapping,
    # so an edit to these values applies to all three steps.
    generation_config: &generation_config
      temperature: 0.1
      top_p: 1.0
      top_k: 0
      n: 1
      max_new_tokens: 2048
      num_beams: 1

  explicit_plan_config:
    model_name: *model_name
    model_type: *model_type
    generation_config: *generation_config

  skeleton_plan_config:
    model_name: *model_name
    model_type: *model_type
    generation_config: *generation_config

train:
  # Settings for synthesizing the data.
  data_synthetic:

    # The batch size to be processed
    batch_size: 20
    # Number of batches processed between two saves
    save_interval: 50
    # Where the synthesized data is stored, and under which name
    synthesized_path: examples/LatentPlan/SynthesizedData
    synthesized_name: direct-deepseek-MATH

    # The data is converted to the Hugging Face format so that it can be
    # uploaded to the website. These are the files created for the latent
    # plans.
    hf_train_filename: train.json
    hf_test_filename: test.json

    # NOTE(review): presumably the Hugging Face dataset repo id — confirm.
    hf_dataname: RDLab/math-direct-deepseek-plan


# Logging level and the paths where experiment outputs are saved.
logging:
  # NOTE(review): presumably the log level applied to LiteLLM — confirm.
  LiteLLM_log_level: WARNING
  # Paths where outputs are saved; leave a value empty to disable saving
  checkpoint_path: experiments/checkpoints
  result_path: experiments/results
  logging_path: experiments/loggings
  visualization_path: experiments/visualizations

# Evaluation settings.
# NOTE(review): no child keys follow this key here, so it parses as null —
# confirm the consumer accepts a null `evaluation` section.
evaluation:
  

   


