#!/bin/bash
# filepath: /paper/prepare_corpus.sh

# Usage:
#   ./prepare_corpus.sh imdb
#   ./prepare_corpus.sh 1billion

# Strict mode: abort on the first failing command (-e), on use of an unset
# variable (-u), and on a failure in any stage of a pipeline (pipefail).
set -euo pipefail

# Read the first positional argument with an empty default so that, under
# `set -u`, a missing argument reaches the "Invalid dataset" branch below
# instead of dying with an "unbound variable" error.
dataset_arg="${1:-}"

echo "Selecting dataset..."
case "$dataset_arg" in
    imdb)
        echo "Using IMDB dataset"
        ;;
    1billion)
        echo "Using 1 billion words dataset"
        ;;
    *)
        # Diagnostics go to stderr so they are not mixed into normal output.
        echo "Invalid dataset. Use 'imdb' or '1billion'." >&2
        exit 1
        ;;
esac
DATASET="$dataset_arg"

# Python entry points, executed in this order with the same --dataset_name
# argument. The paths are relative, so they resolve against the current
# working directory of the caller.
stages=(
    "prepare_corpus.py"
    "embedding-generator/main.py"
    "classification/main.py"
    "clustering/main.py"
    "similarities/main.py"
)

# Because of `set -e`, a non-zero exit from any stage stops the loop and the
# script, so later stages never run after a failed one.
for stage in "${stages[@]}"; do
    python3 "$stage" --dataset_name "$DATASET"
done