#!/bin/bash
# Ablation: Train grasp encoder with recon_loss + kl_loss only (NO DTW)
# This tests if reconstruction + KL regularization alone can learn meaningful latents

# Run from the encoder directory: the training script below is invoked by a
# relative path. Abort if the directory is unavailable so that we never launch
# python from whatever directory the caller happened to be in.
cd /home/placeholder/dsrl/dppo/RLBench_grasp/encoder || {
    printf 'error: cannot cd to %s\n' /home/placeholder/dsrl/dppo/RLBench_grasp/encoder >&2
    exit 1
}

# wandb logging is enabled by default; uncomment the next line to disable it
# export WANDB_MODE=disabled

# Collect the command-line flags in an array so they can be grouped and
# annotated; the array expands to exactly one argument per element.
train_args=(
    # Sequence / model size settings.
    --horizon=107
    --latent_dim=2
    --hidden_dim=128
    --num_layers=4
    --num_heads=4

    # Optimisation schedule.
    --batch_size=32
    --num_epochs=5000
    --lr=1e-4

    # Loss weights: reconstruction + KL only; the DTW weight is zero for
    # this ablation.
    --recon_weight=1.0
    --kl_weight=0.001
    --dtw_weight=0.0

    # Visualisation and checkpoint intervals.
    --vis_freq=100
    --save_freq=500

    # Input data and output directory.
    --dataset_path=/scratch4/workspace/placeholder-hdp1/dppo/data/grasp/variation0/processed/train_normalized.npz
    --episodes_path=/scratch4/workspace/placeholder-hdp1/dppo/data/grasp/variation0/train/episodes
    --save_dir=/scratch4/workspace/placeholder-hdp1/dppo/data/grasp/variation0/encoder_recon_kl

    # Runtime device and experiment-tracking project.
    --device=cuda:0
    --wandb_project=grasp-encoder-ablation
)

python train_grasp_encoder.py "${train_args[@]}"
