#!/bin/bash
# Runs Language/search_glue_no_trainer.py with the configuration defined below.
#
# consts.sh and the Python script are both referenced by relative path, so the
# script has to be started from a directory where those paths resolve.

set -x  # trace each command so the exact invocation shows up in the output
source consts.sh

# Expose only GPU index 5 to the launched process.
export CUDA_VISIBLE_DEVICES=5

TASK_NAME=cola
MODEL_NAME=bert-large-cased
NUM_EXPERTS=8
# MOE_LAYERS, SEEDS and LR are split on whitespace before being passed on, so
# several values can be given as one space-separated string (e.g. "0 1 2").
# NOTE(review): presumably the Python script accepts multiple values for these
# options -- confirm against its argument parser.
MOE_LAYERS="10"
SEEDS="0"
LR="2e-5"
REPEAT=8
TIME=$(date "+%Y%m%d-%H%M%S")
GATE=star
# Set to 1 to append --save_model to the command line (off by default).
SAVE_MODEL=0

# NOTE(review): output_dir is computed but neither exported nor passed to the
# Python command in this script -- confirm whether it should be wired in.
output_dir="logs/${TASK_NAME}/${MODEL_NAME}/${GATE}/moe_${NUM_EXPERTS}_layers${MOE_LAYERS}_repeat${REPEAT}/${TIME}"

# Split the list-valued settings into arrays explicitly instead of relying on
# unquoted expansion, which would also glob-expand the values.
read -r -a seed_list <<<"$SEEDS"
read -r -a lr_list <<<"$LR"
read -r -a moe_layer_list <<<"$MOE_LAYERS"

# Build the argument vector as an array so optional flags can be appended
# without juggling trailing backslashes and commented-out continuation lines.
py_args=(
    --model_name_or_path "$MODEL_NAME"
    --task_name "$TASK_NAME"
    --to_MoE
    --seeds "${seed_list[@]}"
    --num_experts "$NUM_EXPERTS"
    --learning_rates "${lr_list[@]}"
    --moe_layers "${moe_layer_list[@]}"
    --expert_repeat "$REPEAT"
    --gate_type "$GATE"
)

if [[ "$SAVE_MODEL" == "1" ]]; then
    py_args+=(--save_model)
fi

# Kept as the last command so the script's exit status is the Python status.
python Language/search_glue_no_trainer.py "${py_args[@]}"

