import sys
from pathlib import Path
import logger
import time
from llm import LLM
from prompt.start import START_SYSTEM_PROMPT
import utils
import globals


# run_worker: python run_worker.py <run_id> <requirement>
def _find_latest_result_dir(results_root: Path) -> Path:
    dirs = [p for p in results_root.iterdir() if p.is_dir()]
    if not dirs:
        return None
    dirs.sort(key=lambda p: p.stat().st_mtime, reverse=True)
    return dirs[0]


if __name__ == '__main__':
    if len(sys.argv) < 3:
        print('usage: run_worker.py <run_id> <requirement>')
        sys.exit(2)
    run_id = sys.argv[1]
    # requirement 可能包含空格，取剩余所有参数并用空格连接
    requirement = " ".join(sys.argv[2:])

    # 初始化独立日志文件
    logger.init(log_filename=f'run_{run_id}.log')
    # logger.info(f'[Worker] start {run_id} requirement={requirement}')

    try:
        # 延迟导入以减少启动错误
        # 设置 RUN_ID 环境变量，供执行时的工具知晓当前 run
        import os
        os.environ.setdefault("RUN_ID", run_id)

        # 使用 ask_with_tools 入口，由模型自主决定是否调用 run_datascience
        logger.debug(
            f"【API 配置】: {utils.active_api_config},",
        )
        llm = LLM(config_name=utils.active_api_config)
        messages = [
            {"role": "system", "content": START_SYSTEM_PROMPT},
            {"role": "user", "content": requirement+"\n run_id 为 "+run_id},
        ]
        tool_names = ["run_datascience"]
        if getattr(utils.module_config, 'web_datadownload_tool', False):
            tool_names.insert(0, "web_search_summarize")
        response = llm.ask_with_tools(
            messages=messages,
            tool_names=tool_names,
            max_loops=4,
        )
    except Exception as e:
        logger.error(f'[Worker] failed {run_id}: {e}')
        import traceback
        traceback.print_exc()
    finally:
        # 打印本次 run 的 LLM Token 累计消耗
        logger.log_token_summary()
        # logger.info(f'[Worker] exiting {run_id}')