#!/usr/bin/env bash
#
# Runs the dataset processing steps below, in order, on the dump named by BASE.
#
# Each step is handed a file name derived from BASE; the later steps read
# names carrying an extra suffix (.s1, then .s1.s2).
# NOTE(review): presumably each script writes the file the next step reads
# (e.g. filter_bad_conv.py -> ${BASE}.s1.json) -- confirm against the scripts.
#
# Meant to be executed (bash <this file>), not sourced: the strict-mode
# options below would otherwise leak into the calling shell.

# Stop at the first failing step so that later steps (notably the upload)
# never run after an earlier step has failed.
set -euo pipefail

# Exported so the values are also visible in the environment of the
# python3 child processes.
export BASE=clean_conv_20230809_1.5M_pii
export SCALE=1

python3 filter_bad_conv.py --in "${BASE}.json" --sample 1000000

python3 final_post_processing.py --in "${BASE}.s1.json"

python3 upload_hf_dataset.py --in "${BASE}.s1.s2.json"

python3 merge_oai_tag.py --in "${BASE}.s1.s2.json"

python3 compute_stats.py --in "${BASE}.s1.json" --scale "${SCALE}"
