#!/bin/bash
#
# Stage the ImageNet validation and training sets under $SLURM_TMPDIR.
#
# For each split (val, train) the script checks whether
# $SLURM_TMPDIR/ImageNet/<split> already exists. If it does not, the archive
# $project/dataset/imagenet_<split>.tar is copied into $SLURM_TMPDIR,
# extracted there, and the copied archive is removed once extraction succeeds.
#
# Variables read (must be provided by the caller / job environment):
#   SLURM_TMPDIR       destination directory for the copy and extraction
#   project            directory that contains dataset/imagenet_{val,train}.tar
#   SLURM_SUBMIT_HOST  only echoed in the log while staging the train split
#
# Failures of cp/tar are reported on stderr but do not abort the script, so
# the remaining split is still attempted and the elapsed time is always shown.

echo "preparing ImageNet dataset in $SLURM_TMPDIR"
start=$(date +%s)

# --- validation split --------------------------------------------------------
if [ ! -d "$SLURM_TMPDIR/ImageNet/val" ]; then
    echo "copying imagenet_val.tar to $SLURM_TMPDIR"
    if cp "$project/dataset/imagenet_val.tar" "$SLURM_TMPDIR"; then
        echo "extracting imagenet_val.tar to $SLURM_TMPDIR"
        # Drop the copied archive only after a successful extraction so a
        # failed run leaves it in place for inspection.
        tar -xf "$SLURM_TMPDIR/imagenet_val.tar" -C "$SLURM_TMPDIR" \
            && rm -f "$SLURM_TMPDIR/imagenet_val.tar"
    else
        # Nothing to extract when the copy did not succeed.
        echo "failed to copy imagenet_val.tar to $SLURM_TMPDIR" >&2
    fi
else
    echo "ImageNet val dataset already exists in $SLURM_TMPDIR, skipping extraction"
fi

# --- training split ----------------------------------------------------------
if [ ! -d "$SLURM_TMPDIR/ImageNet/train" ]; then
    echo "copying imagenet_train.tar to $SLURM_TMPDIR"
    # NOTE(review): Slurm documents SLURM_SUBMIT_HOST as the host the job was
    # submitted from, which may differ from the node running this script --
    # confirm the log wording is what is intended.
    echo "Running on $SLURM_SUBMIT_HOST"
    if cp "$project/dataset/imagenet_train.tar" "$SLURM_TMPDIR"; then
        echo "extracting imagenet_train.tar to $SLURM_TMPDIR"
        tar -xf "$SLURM_TMPDIR/imagenet_train.tar" -C "$SLURM_TMPDIR" \
            && rm -f "$SLURM_TMPDIR/imagenet_train.tar"
    else
        echo "failed to copy imagenet_train.tar to $SLURM_TMPDIR" >&2
    fi
else
    echo "ImageNet train dataset already exists in $SLURM_TMPDIR, skipping extraction"
fi

end=$(date +%s)
echo "ImageNet dataset prepared in $((end - start)) seconds"