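# Configuration file: LLM backend settings, followed by search, algorithm, seed, device, training, evaluation, offline-data, rendering, and logging settings.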
OPENAI:
  # NOTE(review): this key repeats the section name and is empty; its purpose is not visible in this file - confirm with the loader
  OPENAI: ""
  # API key; empty in this file
  API_KEY: ""
  # model identifier
  MODEL_NAME: "gpt-4o-mini-2024-07-18"
  # embedding model identifier
  EMB_MODEL: "text-embedding-3-small"
  # presumably selects an Azure-hosted endpoint when true - confirm
  IS_AZURE: false
  # request parameters (presumably forwarded to the model API - confirm)
  temperature: 1.0
  max_tokens: 4096
  seed: 1
  # debug switch for this backend; off here
  debug_mode: false
# settings for the DEEPSEEK backend
DEEPSEEK:
  # NOTE(review): empty key named OPENAI inside this section; purpose is not visible in this file - confirm with the loader
  OPENAI: ""
  # API key; empty in this file
  API_KEY: ""
  # base URL of the API endpoint
  BASE_URL: "https://api.deepseek.com"
  # model identifier
  MODEL_NAME: "deepseek-reasoner"
  # NOTE(review): same embedding model name as in the OPENAI section - confirm it is served by the endpoint above
  EMB_MODEL: "text-embedding-3-small"
  # presumably selects an Azure-hosted endpoint when true - confirm
  IS_AZURE: false
  # request parameters (presumably forwarded to the model API - confirm)
  temperature: 0.0
  max_tokens: 4096
  seed: 1
  # debug switch for this backend; off here
  debug_mode: false
# settings for the VLLM backend
VLLM:
  # NOTE(review): empty key named OPENAI inside this section; purpose is not visible in this file - confirm with the loader
  OPENAI: ""
  # literal placeholder string (presumably the local server does not validate it - confirm)
  API_KEY: "EMPTY"
  # base URL of the endpoint; points at localhost port 8018
  BASE_URL: "http://localhost:8018/v1"
  # model identifier; the same value is also used for the embedding model below
  MODEL_NAME: "Qwen/Qwen2-VL-72B-Instruct"
  EMB_MODEL: "Qwen/Qwen2-VL-72B-Instruct"
  # presumably selects an Azure-hosted endpoint when true - confirm
  IS_AZURE: false
  # request parameters (presumably forwarded to the model API - confirm)
  temperature: 0.0
  max_tokens: 4096
  seed: 1
  # debug switch for this backend; off here
  debug_mode: false
# settings for the OLLAMA backend
OLLAMA:
  # NOTE(review): empty key named OPENAI inside this section; purpose is not visible in this file - confirm with the loader
  OPENAI: ""
  # literal placeholder string (presumably the local server does not validate it - confirm)
  API_KEY: "EMPTY"
  # base URL of the endpoint; points at localhost port 11434
  # NOTE(review): unlike the VLLM section, this URL ends with "/" - confirm the client tolerates it
  BASE_URL: "http://localhost:11434/v1/"
  # model identifier; the same value is also used for the embedding model below
  MODEL_NAME: "llama3.2-vision"
  EMB_MODEL: "llama3.2-vision"
  # presumably selects an Azure-hosted endpoint when true - confirm
  IS_AZURE: false
  # request parameters (presumably forwarded to the model API - confirm)
  temperature: 0.0
  max_tokens: 4096
  seed: 1
  # debug switch for this backend; off here
  debug_mode: false
# settings for the CLAUDE backend
CLAUDE:
  # NOTE(review): this key repeats the section name and is empty; its purpose is not visible in this file - confirm with the loader
  CLAUDE: ""
  # API key; empty in this file
  API_KEY: ""
  # model identifier
  MODEL_NAME: "claude-3-haiku-20240307"
  # request parameters (presumably forwarded to the model API - confirm)
  temperature: 0.0
  max_tokens: 4096
  seed: 1
  # debug switch for this backend; off here
  debug_mode: false
  # presumably selects an Azure-hosted endpoint when true - confirm
  IS_AZURE: false
  # NOTE(review): presumably chooses a synchronous client over an asynchronous one - confirm
  USE_SYNC: true
# web search settings
search:
  # API key used for web search; empty in this file
  SEARCHAPI_API_KEY: ""
# algorithm settings
algo:
  # whether agents share parameters
  share_param: false
  # NOTE(review): undocumented switch, enabled here - confirm what "full mode" covers
  use_full_mode: true
# random seed settings
seed:
  # whether the seed given below is used
  seed_specify: true
  # the seed value
  seed: 1
# compute device settings
device:
  # whether CUDA is used
  cuda: true
  # whether CUDA is set to deterministic mode
  cuda_deterministic: true
  # value passed to torch.set_num_threads
  torch_threads: 4
# training settings
train:
  # how many environments run in parallel to collect training data
  n_rollout_threads: 1
  # total training length
  # NOTE(review): the key name says episodes while the earlier comment said "training steps" - confirm the unit
  train_episodes: 100
  # interval between log outputs
  log_interval: 5
  # interval between evaluations
  eval_interval: 25
  # NOTE(review): undocumented interval; presumably governs skill-related updates - confirm
  skill_interval: 20
  # whether truncation is taken into account when an episode is done
  use_proper_time_limits: true
  # NOTE(review): undocumented debug switch, enabled here - confirm what it toggles
  debug: true
# evaluation settings
eval:
  # whether evaluation is enabled
  use_eval: false
  # how many environments run in parallel during evaluation
  n_eval_rollout_threads: 1
  # how many episodes each evaluation runs
  eval_episodes: 2
# offline data settings
offline:
  # whether offline mode is enabled; off here
  use_offline: false
  # NOTE(review): undocumented switch, off here - confirm what tactic refinement does
  refine_tactics: false
  # format tag of the offline data (presumably HDF5 files - confirm)
  offline_data_type: "h5"
  # presumably whether the offline data is shuffled - confirm
  shuffle: true
  # presumably an upper bound on the number of buffered entries - confirm unit
  max_buffer_size: 1000
# rendering settings
render:
  # whether rendering is enabled
  use_render: false
  # how many episodes are rendered
  render_episodes: 10
# logging settings
logger:
  # directory for logs; a relative path (presumably resolved against the working directory - confirm)
  log_dir: "./results"
