# Data
.PHONY: sync-results
sync-results:
	@echo "Syncing results from NGC"
	rm -rf scratch/amine_ws/exp_results
	ngc workspace download amine_ws --dir exp_results  --dest scratch
	

# Training
TRAIN_REQUIRED_ARGS := MIX_NAME MODEL_NAME
.PHONY: train
train:
	@$(foreach var,$(TRAIN_REQUIRED_ARGS),\
			$(if $(value $(var)),,$(error $(var) is not set)))
	@echo "Training with MIX_NAME=$(MIX_NAME) MODEL_NAME=$(MODEL_NAME)"
	NGC_GPU_CNT=8 ./scripts/ngc/run_cmd.sh scripts/ngc/ss_train.sh \
	--mixture_name $(MIX_NAME) \
	--model_name_or_path $(MODEL_NAME) \
    --hp_config oi_no_lora_hp \
    --num_train_epochs 15 \
	--checkpointing_steps epoch

.PHONY: train_qlora
train_qlora:
	@$(foreach var,$(TRAIN_REQUIRED_ARGS),\
			$(if $(value $(var)),,$(error $(var) is not set)))
	@echo "Training with MIX_NAME=$(MIX_NAME) MODEL_NAME=$(MODEL_NAME)"
	NGC_GPU_CNT=8 ./scripts/ngc/run_cmd.sh scripts/ngc/ss_train.sh \
	--mixture_name $(MIX_NAME) \
	--model_name_or_path $(MODEL_NAME) \
    --hp_config oi_qlora_hp \
    --num_train_epochs 15 \
	--checkpointing_steps epoch

SS_TRAIN_REQUIRED_ARGS := MIX_NAME SS_CONFIG MODEL_NAME
.PHONY: ss_train
ss_train:
	@$(foreach var,$(SS_TRAIN_REQUIRED_ARGS),\
			$(if $(value $(var)),,$(error $(var) is not set)))
	@echo "Training with SS with MIX_NAME=$(MIX_NAME) SS_CONFIG=$(SS_CONFIG) MODEL_NAME=$(MODEL_NAME)"
	NGC_GPU_CNT=8 ./scripts/ngc/run_cmd.sh scripts/ngc/ss_train.sh \
	--mixture_name $(MIX_NAME) \
	--ss_config $(SS_CONFIG) \
	--model_name_or_path $(MODEL_NAME) \
    --hp_config oi_hp \


# Evaluations
.PHONY: eval_gsm
eval_gsm:
ifndef EXP 
	$(error EXP is not set)
endif
	@echo "Evaluating math"
	NGC_GPU_CNT=1 ./scripts/ngc/run_cmd.sh scripts/eval/eval_wizzard_gsm.sh $(EXP)


.PHONY: eval_math
eval_math:
ifndef EXP 
	$(error EXP is not set)
endif
	@echo "Evaluating math"
	NGC_GPU_CNT=8 ./scripts/ngc/run_cmd.sh scripts/eval/eval_wizzard_math.sh $(EXP)

LM_EVAL_REQUIRED_ARGS := EXP TASK
LM_EVAL_MATH_TASKS := math_algebra math_counting_and_prob math_geometry math_intermediate_algebra math_num_theory math_prealgebra math_precalc
LM_EVAL_TASKS := piqa winogrande arc_easy arc_challenge openbookqa hellaswag triviaqa squad2 boolq truthfulqa_mc toxigen \
	$(LM_EVAL_MATH_TASKS) \
	bigbench_causal_judgement bigbench_date_understanding bigbench_disambiguation_qa bigbench_dyck_languages bigbench_formal_fallacies_syllogisms_negation \
	bigbench_geometric_shapes bigbench_hyperbaton bigbench_logical_deduction_five_objects bigbench_logical_deduction_seven_objects bigbench_logical_deduction_three_objects \
	bigbench_movie_recommendation bigbench_navigate bigbench_reasoning_about_colored_objects bigbench_ruin_names bigbench_salient_translation_error_detection bigbench_snarks \
	bigbench_sports_understanding bigbench_temporal_sequences bigbench_tracking_shuffled_objects_five_objects \
	bigbench_tracking_shuffled_objects_seven_objects bigbench_tracking_shuffled_objects_three_objects \
    hendrycksTest-abstract_algebra hendrycksTest-anatomy hendrycksTest-astronomy hendrycksTest-business_ethics hendrycksTest-clinical_knowledge \
	hendrycksTest-college_biology hendrycksTest-college_chemistry hendrycksTest-college_computer_science hendrycksTest-college_mathematics \
	hendrycksTest-college_medicine hendrycksTest-college_physics hendrycksTest-computer_security hendrycksTest-conceptual_physics \
	hendrycksTest-econometrics hendrycksTest-electrical_engineering hendrycksTest-elementary_mathematics hendrycksTest-formal_logic \
	hendrycksTest-global_facts hendrycksTest-high_school_biology hendrycksTest-high_school_chemistry hendrycksTest-high_school_computer_science \
	hendrycksTest-high_school_european_history hendrycksTest-high_school_geography hendrycksTest-high_school_government_and_politics \
	hendrycksTest-high_school_macroeconomics hendrycksTest-high_school_mathematics hendrycksTest-high_school_microeconomics hendrycksTest-high_school_physics \
	hendrycksTest-high_school_psychology hendrycksTest-high_school_statistics hendrycksTest-high_school_us_history hendrycksTest-high_school_world_history \
	hendrycksTest-human_aging hendrycksTest-human_sexuality hendrycksTest-international_law hendrycksTest-jurisprudence hendrycksTest-logical_fallacies \
	hendrycksTest-machine_learning hendrycksTest-management hendrycksTest-marketing hendrycksTest-medical_genetics hendrycksTest-miscellaneous \
	hendrycksTest-moral_disputes hendrycksTest-moral_scenarios hendrycksTest-nutrition hendrycksTest-philosophy hendrycksTest-prehistory \
	hendrycksTest-professional_accounting hendrycksTest-professional_law hendrycksTest-professional_medicine hendrycksTest-professional_psychology \
	hendrycksTest-public_relations hendrycksTest-security_studies hendrycksTest-sociology hendrycksTest-us_foreign_policy hendrycksTest-virology hendrycksTest-world_religions

LM_EVAL_TASKS_CNT := $(shell echo $(LM_EVAL_TASKS) | tr ' ' '\n' | wc -l)

.PHONY: eval_lm_harness
eval_lm_harness:
	@$(foreach var,$(LM_EVAL_REQUIRED_ARGS),\
			$(if $(value $(var)),,$(error $(var) is not set)))

ifeq ($(TASK),all_math)
	@$(foreach curr_task,$(LM_EVAL_MATH_TASKS),\
		echo "Running $(curr_task)"; \
		NGC_GPU_CNT=1 NGC_RUN_NAME=eval_$(curr_task)_$(EXP) ./scripts/ngc/run_cmd.sh scripts/eval/eval_hf_llm.sh $(EXP) $(curr_task); \
	)
else
ifeq ($(TASK),all)
	@$(foreach curr_task,$(LM_EVAL_TASKS),\
		echo "Running $(curr_task)"; \
		NGC_GPU_CNT=1 NGC_RUN_NAME=eval_$(curr_task)_$(EXP) ./scripts/ngc/run_cmd.sh scripts/eval/eval_hf_llm.sh $(EXP) $(curr_task); \
	)
else
ifeq (,$(filter $(TASK),$(LM_EVAL_TASKS)))
	$(error TASK is not a known task name $(TASK). Valid=$(LM_EVAL_TASKS))
endif
	@echo "Evaluating $(TASK) for $(EXP) using HF LM eval harness"
	NGC_GPU_CNT=1 NGC_RUN_NAME=eval_$(TASK)_$(EXP) ./scripts/ngc/run_cmd.sh scripts/eval/eval_hf_llm.sh $(EXP) $(TASK) 
endif
endif

.PHONY: eval_lm_tasks
eval_lm_tasks:
	@echo "Total LM_EVAL_TASKS=$(LM_EVAL_TASKS_CNT)"
	
