set -e

# Configuration
MODEL_PATH="Qwen/Qwen2-VL-7B-Instruct"
MODEL_NAME="qwen2_vl_tasm"
TIMESTAMP=$(date +%Y%m%d_%H%M%S)

# Setup environment
export PYTHONPATH="$(pwd)/lmms-eval:$(pwd)/transformers/src:$PYTHONPATH"

# Function to run ImageNet evaluation
run_imagenet() {
    echo "============================================"
    echo "TASM - ImageNet-100 Few-shot Evaluation"
    echo "============================================"
    
    OUTPUT_PATH="./logs/tasm_imagenet_${TIMESTAMP}"
    mkdir -p "${OUTPUT_PATH}"
    
    # TASM full configuration
    MODEL_ARGS="pretrained=${MODEL_PATH}"
    MODEL_ARGS="${MODEL_ARGS},num_fewshot=20"
    MODEL_ARGS="${MODEL_ARGS},task_vector_method=combined"
    
    # Token merging settings
    MODEL_ARGS="${MODEL_ARGS},enable_token_merging=True"
    MODEL_ARGS="${MODEL_ARGS},merge_similarity_threshold=0.5"
    MODEL_ARGS="${MODEL_ARGS},preserve_spatial=True"
    
    # Dynamic retrieval settings
    MODEL_ARGS="${MODEL_ARGS},enable_dynamic_retrieval=True"
    MODEL_ARGS="${MODEL_ARGS},core_compression_ratio=0.1"
    MODEL_ARGS="${MODEL_ARGS},latent_compression_ratio=0.5"
    MODEL_ARGS="${MODEL_ARGS},retrieval_top_k=32"
    
    # Compression settings
    MODEL_ARGS="${MODEL_ARGS},target_compression_ratio=0.2"
    MODEL_ARGS="${MODEL_ARGS},js_threshold=0.005"
    MODEL_ARGS="${MODEL_ARGS},attn_implementation=sdpa"
    
    accelerate launch --num_processes 1 -m lmms_eval \
        --model ${MODEL_NAME} \
        --model_args "${MODEL_ARGS}" \
        --tasks imagenet_100_fewshot \
        --batch_size 1 \
        --output_path ${OUTPUT_PATH} \
        --log_samples
    
    echo "Results saved to: ${OUTPUT_PATH}"
}

# Main execution
run_imagenet

echo "Done!"
