
#!/bin/bash
# Runs the `eval_lm_harness` make target with TASK=piqa once for every
# experiment listed in `exps`.
exps=(
    baseline_reasoning_v2_13b_20230925191622
    baseline_reasoning_v2_7b_20230925185939
    vicuna_13b_v1_5
    vicuna_7b_v1_5
    wizardlm_13b_v1_2
    wizardmath_13b_v1_0
    wizardmath_7b_v1_0
)

#######################################
# Invokes `make eval_lm_harness TASK=piqa EXP=<exp>` for each entry of `exps`,
# in order.
# Globals:   exps (read)
# Arguments: none
# Outputs:   one line on stderr per experiment whose make invocation failed
# Returns:   0 if every invocation succeeded, 1 otherwise
#######################################
run_piqa_evals() {
    local exp
    local -a failed=()

    for exp in "${exps[@]}"; do
        # Keep going after a failure so one broken experiment does not block
        # the remaining ones; the failures are reported once the loop is done.
        make eval_lm_harness "TASK=piqa" "EXP=${exp}" || failed+=("${exp}")
    done

    if (( ${#failed[@]} > 0 )); then
        printf 'eval_lm_harness TASK=piqa failed for EXP=%s\n' "${failed[@]}" >&2
        return 1
    fi
    return 0
}

run_piqa_evals




# Stop here: nothing after this line is executed. With no argument, `exit`
# returns the status of the last command that ran before it.
exit
# Manual re-run of individual evaluation tasks for a single experiment.
# Select the experiment by leaving exactly one `exp=` / `missing=` pair
# uncommented below.

# Not referenced anywhere else in the visible part of this script; kept as a
# list of the known experiment names.
all_exps=(
    baseline_reasoning_v2_13b_20230925191622
    baseline_reasoning_v2_7b_20230925185939
    vicuna_13b_v1_5
    vicuna_7b_v1_5
    wizardlm_13b_v1_2
    wizardmath_13b_v1_0
    wizardmath_7b_v1_0
)

exp=vicuna_13b_v1_5
missing=(math_algebra math_counting_and_prob math_geometry math_intermediate_algebra math_num_theory math_prealgebra math_precalc bigbench_tracking_shuffled_objects_three_object)
# exp=vicuna_7b_v1_5
# missing=(bigbench_tracking_shuffled_objects_three_object)
# exp=wizardlm_13b_v1_2
# missing=(math_algebra math_counting_and_prob math_geometry math_intermediate_algebra math_num_theory math_prealgebra math_precalc squad2 bigbench_tracking_shuffled_objects_three_object hendrycksTest-college_mathematics hendrycksTest-high_school_european_history hendrycksTest-high_school_government_and_politics hendrycksTest-moral_disputes)
# exp=wizardmath_13b_v1_0
# missing=(math_algebra math_counting_and_prob math_geometry math_intermediate_algebra math_num_theory math_prealgebra math_precalc squad2 bigbench_date_understanding bigbench_tracking_shuffled_objects_three_object hendrycksTest-high_school_statistics hendrycksTest-medical_genetics hendrycksTest-nutrition hendrycksTest-public_relations)
# exp=wizardmath_7b_v1_0
# missing=(math_geometry squad2 bigbench_tracking_shuffled_objects_three_object hendrycksTest-high_school_government_and_politics hendrycksTest-high_school_psychology hendrycksTest-human_sexuality hendrycksTest-moral_scenarios hendrycksTest-nutrition)

#######################################
# Invokes `make eval_lm_harness TASK=<task> EXP=<exp>` for each entry of
# `missing`, in order, against the experiment named by `exp`.
# Globals:   exp (read), missing (read)
# Arguments: none
# Outputs:   one line on stderr per task whose make invocation failed
# Returns:   0 if every invocation succeeded, 1 otherwise
#######################################
rerun_missing_tasks() {
    local task
    local -a failed=()

    for task in "${missing[@]}"; do
        # Keep going after a failure so one broken task does not block the
        # remaining ones; the failures are reported once the loop is done.
        make eval_lm_harness "TASK=${task}" "EXP=${exp}" || failed+=("${task}")
    done

    if (( ${#failed[@]} > 0 )); then
        printf "eval_lm_harness EXP=${exp//%/%%} failed for TASK=%s\n" "${failed[@]}" >&2
        return 1
    fi
    return 0
}

rerun_missing_tasks
