#!/bin/bash
set -e

timestamp=$(date +%Y%m%d_%H%M%S)
exp_name=causal_v4_${timestamp}
output_path=outputs/${exp_name}
model_path=/root/autodl-tmp/KnowSelf-main/output/knowself_llama3-8b-alfworld-rpo_merged/

mkdir -p ${output_path}

echo "🧪 因果推理测试 v4（清晰版）"
echo "  测试任务数: 5"
echo "  输出路径: ${output_path}"
echo ""

VLLM_WORKER_MULTIPROC_METHOD=spawn CUDA_VISIBLE_DEVICES=0 \
python -m eval_agent.knowself_eval_vllm_alfworld_causal_v4_clean \
    --gpu_num 1 \
    --exp_config alfworld \
    --output_path ${output_path} \
    --select_agent_config deepseek \
    --select_agent_name deepseek-chat \
    --model_name_or_path ${model_path} \
    --select_knowledge_inst eval_agent/prompt/instructions/select_knowledge_alfworld.txt \
    --knowledge_base_path knowledge_system_construction/automanual_alfworld/autobuild_logs/rule_manager.json \
    --model_type llama3 \
    --split test \
    --part_num 5 \
    --part_idx 0 \
    --enable_causal_reasoning \
    --causal_max_hypotheses 2 \
    --causal_validation_threshold 0.45 \
    --causal_action_weight 0.7 \
    --verbose \
    --override

echo ""
echo "✅ 测试完成！"
echo ""
echo "📊 查看结果:"
echo "  tail -50 ${output_path}/log.txt"
echo ""
echo "🔍 验证因果字段

echo "  python3 << 'PYEOF'
import json
import os

output_dir = '${output_path}'
json_files = [f for f in os.listdir(output_dir) if f.endswith('.json') and f != 'causal_knowledge_base.json']

if json_files:
    sample_file = os.path.join(output_dir, json_files[0])
    with open(sample_file, encoding='utf-8') as f:
        data = json.load(f)
    
    print('\\n✅ 示例JSON结构:')
    print(f'  文件: {json_files[0]}')
    print(f'  顶层字段: {list(data.keys())}')
    
    if 'causal_steps' in data:
        print(f'\\n🔬 因果字段:')
        print(f'  causal_steps: {len(data.get(\"causal_steps\", []))} 步')
        print(f'  causal_actions_used: {data.get(\"causal_actions_used\", 0)}')
        print(f'  causal_adoption_rate: {data.get(\"causal_adoption_rate\", 0)*100:.1f}%')
        
        if data['causal_steps']:
            print(f'\\n📋 第一个因果步骤:')
            step = data['causal_steps'][0]
            for k, v in step.items():
                if isinstance(v, list):
                    print(f'  • {k}: {len(v)} items')
                else:
                    print(f'  • {k}: {str(v)[:60]}')
    else:
        print('\\n❌ 缺少因果字段！')
else:
    print('\\n⚠️ 未找到JSON文件')
PYEOF
"

echo ""
echo "📁 所有输出文件:"
echo "  ls -lh ${output_path}/"
