#!/bin/bash
# Strict mode: abort on any failed command, on use of an unset variable,
# and on a failure in any stage of a pipeline.
set -euo pipefail

# Everything below is downloaded into, and unpacked inside, ./datasets
# (relative to the directory the script is invoked from).
mkdir -p datasets
cd datasets

# --- CIFAR-10 ----------------------------------------------------------------
cifar_url='https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz'
cifar_archive=${cifar_url##*/}   # basename of the URL: cifar-10-python.tar.gz

echo "Downloading CIFAR-10..."
# -O pins the output filename. Without it, wget refuses to overwrite an
# existing file of the same name (for instance a partial archive left behind
# by an interrupted run) and stores the new download as "<name>.1", so the
# tar call below would unpack the stale file instead of the fresh one.
wget -q --show-progress -O "$cifar_archive" "$cifar_url" || {
    rc=$?
    # Do not leave a truncated archive lying around for the next run.
    rm -f -- "$cifar_archive"
    echo "ERROR: CIFAR-10 download failed (wget exit status $rc)." >&2
    exit "$rc"
}
tar -xvf "$cifar_archive"
rm -- "$cifar_archive"

# --- Long Range Arena (LRA) --------------------------------------------------
# This download is best-effort: the upstream bucket is known to reject
# requests, so a failure here prints instructions and lets the script carry
# on with the remaining datasets instead of aborting.
lra_url='https://storage.googleapis.com/long-range-arena/lra_release.gz'
lra_archive='lra_release.gz'

echo "Downloading Long Range Arena (LRA) release..."
echo "NOTE: The original Google Cloud Storage link (storage.googleapis.com/long-range-arena/lra_release.gz)"
echo "      may return 403 Forbidden. If the download below fails, you can obtain the LRA data from:"
echo "      - https://github.com/google-research/long-range-arena (archived, may have mirrors)"
echo "      - https://github.com/lucaslingle/e-lra (maintained fork with automated downloads)"
echo "      Place the extracted lra_release/ directory inside this datasets/ folder."

# wget runs as an `if` condition, so a non-zero exit does not trip `set -e`.
# The extra -s test treats a zero-byte file as a failed download as well,
# rather than silently leaving an empty archive behind.
if wget -q --show-progress -O "$lra_archive" "$lra_url" && [[ -s "$lra_archive" ]]; then
    tar -xvf "$lra_archive"
    rm -- "$lra_archive"
else
    # Remove whatever partial/empty file wget created via -O.
    rm -f -- "$lra_archive"
    # Diagnostics go to stderr so they are not lost when stdout is redirected.
    echo "ERROR: LRA download failed. See notes above for alternative sources." >&2
    echo "       After obtaining lra_release.gz manually, run: tar -xvf lra_release.gz" >&2
fi

# --- IMDb sentiment ----------------------------------------------------------
imdb_url='https://ai.stanford.edu/~amaas/data/sentiment/aclImdb_v1.tar.gz'
imdb_archive=${imdb_url##*/}   # basename of the URL: aclImdb_v1.tar.gz

echo "Downloading IMDb sentiment dataset..."
# -O pins the output filename. Without it, wget refuses to overwrite an
# existing file of the same name (for instance a partial archive left behind
# by an interrupted run) and stores the new download as "<name>.1", so the
# tar call below would unpack the stale file instead of the fresh one.
wget -q --show-progress -O "$imdb_archive" "$imdb_url" || {
    rc=$?
    # Do not leave a truncated archive lying around for the next run.
    rm -f -- "$imdb_archive"
    echo "ERROR: IMDb download failed (wget exit status $rc)." >&2
    exit "$rc"
}
tar -xvf "$imdb_archive"
rm -- "$imdb_archive"

# Final summary: list the directories present in the current working
# directory (the trailing slash in the glob restricts matches to directories).
printf '%s\n' "Done. Dataset directory structure:"
ls -d */
