# Prediction stage: invoke predict_dataset_by_LLMs.py once per
# generation_eval shard with --api_name claude_3_haiku.
#
# Shards are named <variant>_<split>.jsonl. They are visited variant by
# variant in the order listed below, with splits 0, 1, 2 inside each variant.
# The --prompt_id is "direct_" followed by the last underscore-separated
# token of the variant name (language -> direct_language,
# symbolic -> direct_symbolic).
#
# No fail-fast is enabled: a failing invocation does not stop later ones.
for pred_variant in \
  related_word_language \
  random_word_language \
  random_str_language \
  random_str_symbolic \
  random_word_symbolic \
  related_word_symbolic
do
  for pred_split in 0 1 2; do
    pred_shard="${pred_variant}_${pred_split}.jsonl"
    python predict_dataset_by_LLMs.py \
      --dataset AnswerSetGeneration \
      --prompt_path ./prompts/AnswerSetGeneration/test.json \
      --api_name claude_3_haiku \
      --error_extraction_count 3 \
      --data_type "datasets/generation_eval/${pred_shard}" \
      --prediction_path "./predictions/generation_eval/AnswerSetGeneration/claude_3_haiku/${pred_shard}" \
      --prompt_id "direct_${pred_variant##*_}"
  done
done
# Evaluation stage: invoke evaluate_generation.py once per generation_eval
# shard, passing --wandb with project name ASP_ASG_generation_eval and
# model claude_3_haiku.
#
# Shards are named <variant>_<split>.jsonl. They are visited variant by
# variant in the order listed below, with splits 0, 1, 2 inside each variant.
# The --wandb_work_name is the shard name without its .jsonl extension, and
# --prediction_path points at the file of the same name under
# ./predictions/generation_eval/AnswerSetGeneration/claude_3_haiku/.
#
# No fail-fast is enabled: a failing invocation does not stop later ones.
for eval_variant in \
  related_word_language \
  random_word_language \
  random_str_language \
  random_str_symbolic \
  random_word_symbolic \
  related_word_symbolic
do
  for eval_split in 0 1 2; do
    eval_run="${eval_variant}_${eval_split}"
    python evaluate_generation.py \
      --dataset AnswerSetGeneration \
      --wandb \
      --wandb_model_path_name prediction_path \
      --wandb_project_name ASP_ASG_generation_eval \
      --model claude_3_haiku \
      --wandb_work_name "${eval_run}" \
      --data_type "datasets/generation_eval/${eval_run}.jsonl" \
      --prediction_path "./predictions/generation_eval/AnswerSetGeneration/claude_3_haiku/${eval_run}.jsonl"
  done
done
