# CUDA_VISIBLE_DEVICES=0 python3 -m inference_rlhf.code.plot_unique \
#     policy=mistral-7b \
#     user=anonymousanonymous \
#     task=math \
#     reward=armo-rm \
#     +plot.coresets=[vanilla,elliptical] \
#     coreset.elliptical.log_probs_percent_to_filter=0.0 \
#     plot.load_reward_scores=false \
#     plot.load_features=True \
#     plot.load_gradients=false \
#     coreset.elliptical.scale_features_with_log_probs=false \
#     coreset.elliptical.feature_name=armo-rm \
#     coreset.elliptical.feature_type=last_hidden_state \
#     coreset.elliptical.perform_pca=false \
#     coreset.elliptical.pca_dim=512 \
#     coreset.elliptical.perform_sparse_projection=true \
#     coreset.elliptical.use_gradients=false \
#     coreset.elliptical.argmax=true \
#     coreset.elliptical.lamb=1.0 \
#     coreset.vanilla.log_probs_percent_to_filter=0.0 \
#     coreset.elliptical.alpha=0.0 \
#     coreset.elliptical.temp=0.0 \
#     coreset.elliptical.center_features=true \
#     plot.reparse_answers=false &

# CUDA_VISIBLE_DEVICES=1 python3 -m inference_rlhf.code.plot_unique \
#     policy=phi-35-mini \
#     user=anonymousanonymous \
#     task=math \
#     reward=armo-rm \
#     +plot.coresets=[vanilla,elliptical] \
#     coreset.elliptical.log_probs_percent_to_filter=0.0 \
#     plot.load_reward_scores=false \
#     plot.load_features=True \
#     plot.load_gradients=false \
#     coreset.elliptical.scale_features_with_log_probs=false \
#     coreset.elliptical.feature_name=armo-rm \
#     coreset.elliptical.feature_type=last_hidden_state \
#     coreset.elliptical.perform_pca=false \
#     coreset.elliptical.pca_dim=512 \
#     coreset.elliptical.perform_sparse_projection=true \
#     coreset.elliptical.use_gradients=false \
#     coreset.elliptical.argmax=true \
#     coreset.elliptical.lamb=1.0 \
#     coreset.vanilla.log_probs_percent_to_filter=0.0 \
#     coreset.elliptical.alpha=0.0 \
#     coreset.elliptical.temp=0.0 \
#     coreset.elliptical.center_features=true \
#     plot.reparse_answers=false &

# CUDA_VISIBLE_DEVICES=2 python3 -m inference_rlhf.code.plot_unique \
#     policy=llama-3-3b \
#     user=anonymousanonymous \
#     task=math \
#     reward=armo-rm \
#     +plot.coresets=[vanilla,elliptical] \
#     coreset.elliptical.log_probs_percent_to_filter=0.0 \
#     plot.load_reward_scores=false \
#     plot.load_features=True \
#     plot.load_gradients=false \
#     coreset.elliptical.scale_features_with_log_probs=false \
#     coreset.elliptical.feature_name=armo-rm \
#     coreset.elliptical.feature_type=last_hidden_state \
#     coreset.elliptical.perform_pca=false \
#     coreset.elliptical.pca_dim=512 \
#     coreset.elliptical.perform_sparse_projection=true \
#     coreset.elliptical.use_gradients=false \
#     coreset.elliptical.argmax=true \
#     coreset.elliptical.lamb=1.0 \
#     coreset.vanilla.log_probs_percent_to_filter=0.0 \
#     coreset.elliptical.alpha=0.0 \
#     coreset.elliptical.temp=0.0 \
#     coreset.elliptical.center_features=true \
#     plot.reparse_answers=false &

# Launch the plot_unique module for the qwen-25-3b policy as a background job,
# with CUDA_VISIBLE_DEVICES=3 exported into that process's environment.
# Every key=value argument is handed to the module verbatim as a config
# override (these look like Hydra-style overrides -- TODO confirm against
# inference_rlhf.code.plot_unique).
#
# The list-valued override is single-quoted on purpose: unquoted, the shell
# treats `[vanilla,elliptical]` as a glob bracket expression, so the argument
# could be rewritten if a matching filename exists in the working directory
# (or rejected outright under failglob / nullglob).
CUDA_VISIBLE_DEVICES=3 python3 -m inference_rlhf.code.plot_unique \
    policy=qwen-25-3b \
    user=anonymousanonymous \
    task=math \
    reward=armo-rm \
    '+plot.coresets=[vanilla,elliptical]' \
    coreset.elliptical.log_probs_percent_to_filter=0.0 \
    plot.load_reward_scores=false \
    plot.load_features=True \
    plot.load_gradients=false \
    coreset.elliptical.scale_features_with_log_probs=false \
    coreset.elliptical.feature_name=qwen-25-3b-yi1zme99-checkpoint-160 \
    coreset.elliptical.feature_type=last_hidden_state \
    coreset.elliptical.perform_pca=false \
    coreset.elliptical.pca_dim=512 \
    coreset.elliptical.perform_sparse_projection=true \
    coreset.elliptical.use_gradients=false \
    coreset.elliptical.argmax=true \
    coreset.elliptical.lamb=1.0 \
    coreset.vanilla.log_probs_percent_to_filter=0.0 \
    coreset.elliptical.alpha=0.0 \
    coreset.elliptical.temp=0.0 \
    coreset.elliptical.center_features=true \
    plot.reparse_answers=false &
plot_pid=$!

# A bare `wait` always returns 0, which would hide a crashed job. Wait on the
# recorded PID first so its exit status can be captured.
plot_status=0
wait "$plot_pid" || plot_status=$?

# Barrier for any other background jobs started by this script (a no-op when
# there are none).
wait

# Report the job's outcome as the script's own exit status.
exit "$plot_status"