#!/bin/bash

#=========================================#
echo 'This file has been scrubbed to maintain anonymity during the review process.'

#=========================================#
PROJ_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)
DATA_DIR=${PROJ_DIR}/data
export HF_HOME=${DATA_DIR}/huggingface

mkdir -p ${DATA_DIR}
cd ${DATA_DIR}

#=========================================#
# # Check if authenticated with Hugging Face
# echo "Checking Hugging Face authentication..."
# HF_STATUS=$(uv run hf whoami 2>&1)
# if echo "$HF_STATUS" | grep -q "Not logged in"; then
#     echo "❌ Not logged in to Hugging Face!"
#     echo "Please run: uv run hf login"
#     echo "You'll need a Hugging Face account and token (URL anonymized for review)"
#     exit 1
# fi

# echo "✅ Authenticated with Hugging Face"

#=========================================#
# Geo-FNO
#=========================================#
mkdir -p Geo-FNO
echo "Downloading Geo-FNO dataset..."
uv run hf download --repo-type dataset ANON/PDE_DATASET Geo-FNO.tar.gz --local-dir .
echo "Extracting Geo-FNO dataset..."
tar -xzf Geo-FNO.tar.gz
rm -rf Geo-FNO.tar.gz

#=========================================#
# FNO
#=========================================#
mkdir -p FNO
echo "Downloading FNO dataset..."
uv run hf download --repo-type dataset ANON/PDE_DATASET FNO.tar.gz --local-dir .
echo "Extracting FNO dataset..."
tar -xzf FNO.tar.gz
rm -rf FNO.tar.gz

#=========================================#
# SHAPENET-CAR
#=========================================#
mkdir -p ShapeNet-Car
echo "Downloading ShapeNet-Car dataset..."
cd ShapeNet-Car
wget http://www.nobuyuki-umetani.com/publication/mlcfd_data.zip
unzip mlcfd_data.zip
rm -rf __MACOSX
cd mlcfd_data
cd training_data
tar -xvzf param0.tar.gz
tar -xvzf param1.tar.gz
tar -xvzf param2.tar.gz
tar -xvzf param3.tar.gz
tar -xvzf param4.tar.gz
tar -xvzf param5.tar.gz
tar -xvzf param6.tar.gz
tar -xvzf param7.tar.gz
tar -xvzf param8.tar.gz
# remove folders without quadpress_smpl.vtk
rm -rf ./param2/854bb96a96a4d1b338acbabdc1252e2f
rm -rf ./param2/85bb9748c3836e566f81b21e2305c824
rm -rf ./param5/9ec13da6190ab1a3dd141480e2c154d3
rm -rf ./param8/c5079a5b8d59220bc3fb0d224baae2a

rm -rf mlcfd_data.zip
rm -rf mlcfd_data/training_data/*tar.gz

cd $DATA_DIR

#=========================================#
# DRIVAERML
#=========================================#
mkdir -p DrivAerML
echo "Downloading and extracting DrivAerML dataset..."

cd DrivAerML

for num_points in 10k 40k 100k 200k 300k 400k 500k 1m; do
    uv run hf download --repo-type dataset ANON/PDE_DATASET drivaerml_surface_presampled_${num_points}.tar.gz --local-dir .
    tar -xzf drivaerml_surface_presampled_${num_points}.tar.gz
    rm -rf drivaerml_surface_presampled_${num_points}.tar.gz
done

cd $DATA_DIR

#=========================================#
#