#!/usr/bin/env bash
#
# Runs predict_dataset_by_LLMs.py for every nm_CoT_eval dataset variant using
# the ollama_qwen2_7b API name and the "CoT" prompt id, then runs evaluate.py
# on each resulting prediction file.
#
# Usage: run from the directory that contains predict_dataset_by_LLMs.py and
# evaluate.py; every path below is relative to the current directory.
#
# Ordering: all 18 predictions run first, then all 18 evaluations, both in the
# order of the variant list built below.
#
# Exit status: a failing step does not stop the remaining steps. Each failure
# is reported on stderr and counted, and the final status is non-zero when at
# least one step failed.

# -u turns a misspelled variable name into an error instead of an empty path.
# -e is intentionally NOT enabled: one failing variant must not prevent the
# other variants from running; failures are tracked explicitly by run_step.
set -u

readonly MODEL='ollama_qwen2_7b'
readonly DATASET='LabelClassificationSubset'
readonly DATA_DIR='datasets/nm_CoT_eval'
readonly PREDICTION_DIR="./predictions/nm_CoT_eval/LabelClassification/${MODEL}"

# Dataset variants are named "<family>_<index>"; each family has indices 0-2.
# The family order determines the execution order.
variants=()
for family in \
  related_word_language \
  random_word_language \
  random_str_language \
  random_str_symbolic \
  random_word_symbolic \
  related_word_symbolic; do
  for index in 0 1 2; do
    variants+=("${family}_${index}")
  done
done

# Number of steps that exited non-zero.
failures=0

#######################################
# Runs a command; on a non-zero exit, logs the command and counts the failure.
# Globals:   failures (incremented on failure)
# Arguments: the command and its arguments
# Outputs:   a shell-quoted copy of the failed command on stderr
# Returns:   always 0, so that the caller continues with the next step
#######################################
run_step() {
  local status=0
  "$@" || status=$?
  if ((status != 0)); then
    printf 'FAILED (exit %d):' "${status}" >&2
    printf ' %q' "$@" >&2
    printf '\n' >&2
    failures=$((failures + 1))
  fi
  return 0
}

# Phase 1: write one prediction file per variant.
for variant in "${variants[@]}"; do
  run_step python predict_dataset_by_LLMs.py \
    --dataset "${DATASET}" \
    --prompt_path ./prompts/LabelClassification/test.json \
    --prompt_id CoT \
    --api_name "${MODEL}" \
    --error_extraction_count 1 \
    --data_type "${DATA_DIR}/${variant}.jsonl" \
    --prediction_path "${PREDICTION_DIR}/${variant}.jsonl"
done

# Phase 2: evaluate each prediction file against its dataset file.
# NOTE(review): --wandb presumably reports the results to the
# ASP_nm_CoT_eval project under the variant's name; confirm in evaluate.py.
for variant in "${variants[@]}"; do
  run_step python evaluate.py \
    --dataset "${DATASET}" \
    --wandb \
    --wandb_model_path_name prediction_path \
    --wandb_project_name ASP_nm_CoT_eval \
    --model "${MODEL}" \
    --wandb_work_name "${variant}" \
    --data_type "${DATA_DIR}/${variant}.jsonl" \
    --prediction_path "${PREDICTION_DIR}/${variant}.jsonl"
done

if ((failures > 0)); then
  printf '%d step(s) failed; see the FAILED lines above.\n' "${failures}" >&2
fi

# As the last command, this makes the script's exit status non-zero when any
# step failed, without calling `exit`.
((failures == 0))
