#!/usr/bin/env bash
#
# Chain-of-thought (prompt id "CoT") sweep for claude_3_haiku on
# LabelClassificationSubset.
#
# Phase 1 runs predict_dataset_by_LLMs.py once per dataset file.
# Phase 2 runs evaluate.py (with --wandb) once per prediction file.
# All predictions are issued before any evaluation starts.
#
# The sweep covers six dataset variants with three indices (0, 1, 2) each,
# i.e. 18 prediction runs followed by 18 evaluation runs.
#
# All paths are relative, so run this from the directory that contains the
# two Python scripts.
#
# A failing command does NOT stop the sweep (the remaining runs still
# execute), but every failure is reported on stderr and the final status of
# this script is non-zero when at least one run failed.
#
# Only POSIX sh constructs are used so `sh <script>` keeps working as well.

# Settings shared by every run.
dataset=LabelClassificationSubset
model=claude_3_haiku
prompt_path=./prompts/LabelClassification/test.json
prompt_id=CoT
error_extraction_count=3
data_dir=datasets/normal_eval
prediction_dir=./predictions/CoT_eval/LabelClassification/${model}
wandb_project=ASP_CoT_eval

# Number of commands that returned a non-zero status.
failures=0

# Generate predictions for one dataset file.
#   $1 - dataset name without the .jsonl extension
predict() {
  python predict_dataset_by_LLMs.py \
    --dataset "$dataset" \
    --prompt_path "$prompt_path" \
    --prompt_id "$prompt_id" \
    --api_name "$model" \
    --error_extraction_count "$error_extraction_count" \
    --data_type "${data_dir}/$1.jsonl" \
    --prediction_path "${prediction_dir}/$1.jsonl"
}

# Evaluate the prediction file of one dataset; the dataset name doubles as
# the value of --wandb_work_name.
#   $1 - dataset name without the .jsonl extension
evaluate() {
  python evaluate.py \
    --dataset "$dataset" \
    --wandb \
    --wandb_model_path_name prediction_path \
    --wandb_project_name "$wandb_project" \
    --model "$model" \
    --wandb_work_name "$1" \
    --data_type "${data_dir}/$1.jsonl" \
    --prediction_path "${prediction_dir}/$1.jsonl"
}

# Call the function named by $1 once per dataset, in sweep order, counting
# (but not aborting on) failures.
#   $1 - name of the function to call; it receives the dataset name
for_each_dataset() {
  for variant in \
    related_word_language \
    random_word_language \
    random_str_language \
    random_str_symbolic \
    random_word_symbolic \
    related_word_symbolic
  do
    for index in 0 1 2; do
      if ! "$1" "${variant}_${index}"; then
        printf '%s failed for %s\n' "$1" "${variant}_${index}" >&2
        failures=$((failures + 1))
      fi
    done
  done
}

for_each_dataset predict
for_each_dataset evaluate

if [ "$failures" -ne 0 ]; then
  printf '%s run(s) failed\n' "$failures" >&2
fi

# Deliberately a plain test instead of `exit`: as the last command it sets
# the script's exit status without terminating a shell that sources this file.
[ "$failures" -eq 0 ]
