# Dotted path naming the agent class. Presumably imported by the framework
# when this config is loaded — confirm against the loader.
agent_cls: skyrl_agent.agents.react.ReActAgent

# Dotted path naming the task class (presumably resolved the same way).
task: skyrl_agent.tasks.general_react.utils.GeneralReactTask

# Names of the tools listed for this agent. NOTE(review): presumably each
# name must match an entry in the project's tool registry — verify there.
tools:
  - finish
  - faiss_search


# Dataset-related settings.
data:
  # NOTE(review): presumably the name of the field in each input record that
  # identifies its data source — confirm against the data loading code.
  data_source_key: data_source

# Generation settings. NOTE(review): the meaning of individual keys is
# inferred from their names only; confirm against the code that consumes
# this config before relying on any comment below.
generator:
  infer_backend: openai_server
  # Settings for the backend named by infer_backend above.
  backend_config:
    model_name: "Qwen/Qwen3-32B"
    api_url: "http://localhost:8000"
    model_max_len: 40960
  num_trajectories: 1
  max_iterations: 30
  # NOTE(review): max_prompt_length (32768) + sampling_params.max_tokens
  # (32768) = 65536, which is larger than backend_config.model_max_len
  # (40960). Confirm the consumer clamps the generation budget instead of
  # failing when a long prompt is combined with the full max_tokens.
  max_prompt_length: 32768
  sampling_params:
    temperature: 0.5
    top_p: 0.95
    max_tokens: 32768
  # Presumably overrides applied for validation runs — TODO confirm. Note
  # that temperature is 1 here, versus 0.5 in sampling_params above.
  val_config:
    num_trajectories: 1
    sampling_params:
      temperature: 1
      top_p: 0.95
      max_tokens: 32768
  remove_think_tokens: false
  vision_is_active: false
  # Qwen3-specific switches; exact effect is not visible in this file.
  qwen3_enable_thinking: true
  qwen3_acc_thinking: true
  early_step_threshold: 7
  enable_turn_reminder: true

# Dispatcher settings. NOTE(review): the set of valid `type` and `scheduler`
# values is not visible here — confirm against the dispatcher implementation.
dispatcher:
  type: async_batch
  scheduler: naive
  # Both limits are set to 1; presumably this means agents run one at a time
  # for both regular and eval runs — verify before raising for throughput.
  max_parallel_agents: 1
  max_eval_parallel_agents: 1
  max_eval_parallel_agents: 1

