#!/bin/bash

# LLaMA 3.2-1B MXFP4 GPTQ Quantization with Learned Affine Transforms
# This script runs the main quantization program with optimized parameters

# Assemble the full command line as an array so each flag/value pair sits on
# its own line without backslash continuations; the argv handed to python3 is
# the same words in the same order as a single continued command would give.
launch=(
  python3 main.py

  # Model and calibration data
  --model_name meta-llama/Llama-3.2-1B
  --calibration_dataset wikitext-2
  --n_samples 256
  --base_dtype bfloat16

  # Quantization formats and post-training quantization algorithm
  --weight_quant_format fp4_e2m1
  --act_quant_format fp4_e2m1
  --ptq_alg gptq

  # Transform classes and matrix parameterization
  --transform_class_r1 learned_affine
  --transform_class_r2 learned_affine
  --matrix_init hadamard
  --mat_param learnable_inv

  # Optimization hyperparameters
  --learning_rate 3e-5
  --weight_decay 0.05
  --max_steps 1000
  --lr_scheduler cosine
  --warmup_iters 10
  --reg_lambda 1e-1
  --batch_size 8

  # Device and evaluation tasks (the task names follow --eval_tasks as
  # separate arguments)
  --device cuda
  --eval_tasks winogrande piqa openbookqa boolq arc_easy
)

# Run it; being the last command, its exit status becomes the script's.
"${launch[@]}"

