from evaluate import eval_wtq,eval_tabfact
# NOTE: the triple-quoted string below is NOT a module docstring (it comes
# after the import) and nothing inside it is executed. It is a bare string
# expression used to park disabled evaluation invocations: single-file
# tabfact / wtq runs and two-file runs with n_times=1. Only the calls placed
# after the closing quotes actually run.
'''
print('tabfact_agent_sql:')
eval_tabfact(
    checkpoints="/home/yangzhen/code/trillm/output/tab_agent_triple/result.jsonl",
    n_times=1
)
#
print('tabfact_cot_sql:')
eval_tabfact(
    checkpoints="/home/yangzhen/code/trillm/output/tab_cot_triple/result.jsonl",
    n_times=1
)
#
print('tabfact_triple_valid and tabfact_cot_sql:')
eval_tabfact(
    checkpoints=["/home/yangzhen/code/trillm/output/tab_agent_triple/result.jsonl","/home/yangzhen/code/trillm/output/tab_cot_triple/result.jsonl"],
    elements_per_checkpoint=[5,3],
    n_times=1
)

print('wtq_triple_valid:')
eval_wtq(
    checkpoints="/home/yangzhen/code/trillm/output/wtq_triple_valid/result.jsonl",
    n_times=1
)
print('wtq_agent_triple:')
eval_wtq(
    checkpoints="/home/yangzhen/code/trillm/output/wtq_agent_triple/result.jsonl",
    n_times=1
)
eval_wtq(
    checkpoints=["/home/yangzhen/code/trillm/output/wtq_triple_valid/result.jsonl","/home/yangzhen/code/trillm/output/wtq_agent_triple/result.jsonl"],
    elements_per_checkpoint=[3,5],
    n_times=1
)
'''
# Active runs: one eval_tabfact call and one eval_wtq call, each given a pair
# of result files. The semantics of elements_per_checkpoint and n_times live
# in the evaluate module, which is not visible from this script.
_OUTPUT_ROOT = "/home/yangzhen/code/trillm/output"


def _result_path(run_name):
    """Return the result.jsonl path of *run_name* under _OUTPUT_ROOT."""
    return _OUTPUT_ROOT + "/" + run_name + "/result.jsonl"


# TabFact: the printed label is reproduced verbatim from the original script.
print('tabfact_triple_valid and tabfact_cot_sql:')
_tabfact_checkpoints = [
    _result_path("tab_agent_triple"),
    _result_path("tab_cot_triple"),
]
eval_tabfact(
    checkpoints=_tabfact_checkpoints,
    elements_per_checkpoint=[5, 5],
    n_times=10,
)

# WTQ: the original prints no label before this run, so none is printed here.
_wtq_checkpoints = [
    _result_path("wtq_triple_valid"),
    _result_path("wtq_agent_triple"),
]
eval_wtq(
    checkpoints=_wtq_checkpoints,
    elements_per_checkpoint=[5, 5],
    n_times=10,
)
