
# Collect the results tagged v2_300 (seed 1) for the hle_text and browsecomp
# evals and write them to simple-evals/outputs/leaderboard.csv.
#
# The model list covers three model families (o3, o4-mini, claude-4-sonnet),
# each with the same set of variants: the bare model, react-*,
# search-o1-tool-*, hf-odr-*, gpt-researcher-*, drreact-* and drreact-summ-*.
#
# The list is a single comma-separated string. Inside double quotes a
# backslash-newline is removed, so the continuation lines MUST start at
# column 0 (leading whitespace would end up inside a model name), and the last
# entry MUST NOT be followed by a comma (a trailing comma would pass an empty
# final model name to the collector).
v2_models="o3,\
react-o3-1,react-o3-5,react-o3-10,\
search-o1-tool-o3-1,search-o1-tool-o3-5,search-o1-tool-o3-10,search-o1-tool-o3-25,search-o1-tool-o3-50,search-o1-tool-o3-100,\
hf-odr-o3,gpt-researcher-o3,\
drreact-o3-10,drreact-o3-25,drreact-o3-50,drreact-o3-100,\
drreact-summ-o3-100-50,drreact-summ-o3-150-50,\
\
o4-mini,\
react-o4-mini-1,react-o4-mini-5,react-o4-mini-10,\
search-o1-tool-o4-mini-1,search-o1-tool-o4-mini-5,search-o1-tool-o4-mini-10,search-o1-tool-o4-mini-25,search-o1-tool-o4-mini-50,search-o1-tool-o4-mini-100,\
hf-odr-o4-mini,gpt-researcher-o4-mini,\
drreact-o4-mini-10,drreact-o4-mini-25,drreact-o4-mini-50,drreact-o4-mini-100,\
drreact-summ-o4-mini-100-50,drreact-summ-o4-mini-150-50,\
\
claude-4-sonnet,\
react-claude-4-sonnet-1,react-claude-4-sonnet-5,react-claude-4-sonnet-10,\
search-o1-tool-claude-4-sonnet-1,search-o1-tool-claude-4-sonnet-5,search-o1-tool-claude-4-sonnet-10,search-o1-tool-claude-4-sonnet-25,search-o1-tool-claude-4-sonnet-50,search-o1-tool-claude-4-sonnet-100,\
hf-odr-claude-4-sonnet,gpt-researcher-claude-4-sonnet,\
drreact-claude-4-sonnet-10,drreact-claude-4-sonnet-25,drreact-claude-4-sonnet-50,drreact-claude-4-sonnet-100,\
drreact-summ-claude-4-sonnet-100-50,drreact-summ-claude-4-sonnet-150-50"

python simple-evals/scripts/collect_results.py \
    --models "$v2_models" \
    --evals hle_text,browsecomp \
    --output-dir simple-evals/outputs --tag v2_300 --output-csv simple-evals/outputs/leaderboard.csv --seeds 1


# Collect the results tagged v3_300 (seed 1) for the two drreact-summ-o3
# configurations on the hle_text and browsecomp evals.
#
# NOTE(review): this writes to the same --output-csv path as the v2_300 run
# earlier in this file, and both model names also appear in that run's list.
# Confirm that collect_results.py merges into an existing CSV rather than
# overwriting it.
#
# Uncomment to list the output directories of the two models:
#ls simple-evals/outputs/drreact-summ-o3-100-50
#ls simple-evals/outputs/drreact-summ-o3-150-50
v3_models=drreact-summ-o3-100-50,drreact-summ-o3-150-50
v3_outputs_root=simple-evals/outputs

python simple-evals/scripts/collect_results.py \
    --models "$v3_models" \
    --evals hle_text,browsecomp \
    --output-dir "$v3_outputs_root" \
    --tag v3_300 \
    --output-csv "$v3_outputs_root/leaderboard.csv" \
    --seeds 1

