# Runs predict_dataset_by_LLMs.py and then evaluate.py for the o1_mini model on
# every dataset file under datasets/small_nm_eval (LabelClassificationSubset).
#
# Execution order is deliberate and matches a plain top-to-bottom command list:
# all 18 prediction runs happen first, then all 18 evaluation runs. No
# errexit option is enabled, so a failing run does not stop the ones after it,
# and the script's exit status is that of the final evaluate.py invocation.

nm_model=o1_mini
nm_data_dir=datasets/small_nm_eval
nm_pred_dir=./predictions/small_nm_eval/LabelClassification/${nm_model}

# Produce the prediction file for one dataset.
# Arguments: $1 - dataset file stem, e.g. related_word_language_0
nm_predict() {
  python predict_dataset_by_LLMs.py \
    --dataset LabelClassificationSubset \
    --prompt_path ./prompts/LabelClassification/test.json \
    --prompt_id direct \
    --api_name "${nm_model}" \
    --error_extraction_count 1 \
    --temperature 1 \
    --data_type "${nm_data_dir}/${1}.jsonl" \
    --prediction_path "${nm_pred_dir}/${1}.jsonl"
}

# Evaluate the prediction file of one dataset; the dataset stem doubles as the
# --wandb_work_name value.
# Arguments: $1 - dataset file stem, e.g. related_word_language_0
nm_evaluate() {
  python evaluate.py \
    --dataset LabelClassificationSubset \
    --wandb \
    --wandb_model_path_name prediction_path \
    --wandb_project_name ASP_small_nm_eval \
    --model "${nm_model}" \
    --wandb_work_name "${1}" \
    --data_type "${nm_data_dir}/${1}.jsonl" \
    --prediction_path "${nm_pred_dir}/${1}.jsonl"
}

# Call the given function once per dataset stem: six variants, each with the
# numeric suffixes 0, 1 and 2, in a fixed order.
# Arguments: $1 - name of the function to invoke with the stem
nm_for_each_dataset() {
  for nm_variant in \
    related_word_language \
    random_word_language \
    random_str_language \
    random_str_symbolic \
    random_word_symbolic \
    related_word_symbolic
  do
    for nm_idx in 0 1 2; do
      "$1" "${nm_variant}_${nm_idx}"
    done
  done
}

nm_for_each_dataset nm_predict
nm_for_each_dataset nm_evaluate
