# Experiments for Baselines and Comparison with Methods from the Literature
# llama1_7b: base_model run and fp8 run (fp8 uses spike_threshold=inf).
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama1_7b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama1_7b cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama1_7b: entquant_fp8 sweep over reg_param (0.5 to 256.0) with spike_threshold=50.0;
# lr=1.0 for reg_param <= 14.5 and lr=0.25 for reg_param >= 30.0.
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_7b cfg.entquant.config.optimizer.reg_param=0.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_7b cfg.entquant.config.optimizer.reg_param=1.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_7b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_7b cfg.entquant.config.optimizer.reg_param=7.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_7b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_7b cfg.entquant.config.optimizer.reg_param=30.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_7b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_7b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_7b cfg.entquant.config.optimizer.reg_param=128.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_7b cfg.entquant.config.optimizer.reg_param=256.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama1_7b: bnb_nf4 run (no extra overrides).
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama1_7b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama1_7b: hqq runs over (group_size, nbits):
# nbits=4 with 128/64, nbits=3 with 128/64/32, nbits=2 with 64/32/16.
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_7b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_7b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_7b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_7b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_7b cfg.quantization.config.group_size=16 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama1_13b: base_model run and fp8 run (fp8 uses spike_threshold=inf).
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama1_13b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama1_13b cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama1_13b: entquant_fp8 sweep over reg_param (0.5 to 256.0) with spike_threshold=50.0;
# lr=1.0 for reg_param <= 14.5 and lr=0.25 for reg_param >= 30.0.
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_13b cfg.entquant.config.optimizer.reg_param=0.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_13b cfg.entquant.config.optimizer.reg_param=1.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_13b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_13b cfg.entquant.config.optimizer.reg_param=7.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_13b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_13b cfg.entquant.config.optimizer.reg_param=30.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_13b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_13b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_13b cfg.entquant.config.optimizer.reg_param=128.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_13b cfg.entquant.config.optimizer.reg_param=256.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama1_13b: bnb_nf4 run (no extra overrides).
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama1_13b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama1_13b: hqq runs over (group_size, nbits):
# nbits=4 with 128/64, nbits=3 with 128/64/32, nbits=2 with 64/32/16.
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_13b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_13b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_13b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_13b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_13b cfg.quantization.config.group_size=16 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama1_30b: base_model run and fp8 run (fp8 uses spike_threshold=inf).
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama1_30b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama1_30b cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama1_30b: entquant_fp8 sweep over reg_param (0.5 to 256.0) with spike_threshold=50.0;
# lr=1.0 for reg_param <= 14.5 and lr=0.25 for reg_param >= 30.0.
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_30b cfg.entquant.config.optimizer.reg_param=0.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_30b cfg.entquant.config.optimizer.reg_param=1.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_30b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_30b cfg.entquant.config.optimizer.reg_param=7.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_30b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_30b cfg.entquant.config.optimizer.reg_param=30.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_30b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_30b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_30b cfg.entquant.config.optimizer.reg_param=128.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama1_30b cfg.entquant.config.optimizer.reg_param=256.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama1_30b: bnb_nf4 run (no extra overrides).
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama1_30b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama1_30b: hqq runs over (group_size, nbits):
# nbits=4 with 128/64, nbits=3 with 128/64/32, nbits=2 with 64/32/16.
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_30b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_30b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_30b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_30b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_30b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_30b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_30b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama1_30b cfg.quantization.config.group_size=16 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_7b: base_model run and fp8 run (fp8 uses spike_threshold=inf).
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_7b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_7b cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_7b: entquant_fp8 sweep over reg_param (0.5 to 256.0) with spike_threshold=inf;
# lr=1.0 for reg_param <= 14.5 and lr=0.25 for reg_param >= 30.0.
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=0.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=1.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=7.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=30.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=128.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=256.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_7b: bnb_nf4 run (no extra overrides).
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama2_7b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_7b: hqq runs over (group_size, nbits):
# nbits=4 with 128/64, nbits=3 with 128/64/32, nbits=2 with 64/32/16.
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=16 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_13b: base_model run and fp8 run (fp8 uses spike_threshold=inf).
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_13b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_13b cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_13b: entquant_fp8 sweep over reg_param (0.5 to 256.0) with spike_threshold=inf;
# lr=1.0 for reg_param <= 14.5 and lr=0.25 for reg_param >= 30.0.
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=0.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=1.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=7.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=30.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=128.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=256.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_13b: bnb_nf4 run (no extra overrides).
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama2_13b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_13b: hqq runs over (group_size, nbits):
# nbits=4 with 128/64, nbits=3 with 128/64/32, nbits=2 with 64/32/16.
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=16 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_70b: base_model run and fp8 run (fp8 uses spike_threshold=inf).
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_70b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_70b cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_70b: entquant_fp8 sweep over reg_param (0.5 to 256.0) with spike_threshold=inf;
# lr=1.0 for reg_param <= 14.5 and lr=0.25 for reg_param >= 30.0.
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=0.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=1.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=7.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=30.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=128.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=256.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_70b: bnb_nf4 run (no extra overrides).
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama2_70b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama2_70b: hqq runs over (group_size, nbits):
# nbits=4 with 128/64, nbits=3 with 128/64/32, nbits=2 with 64/32/16.
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=16 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama31_8b: base_model run and fp8 run (fp8 uses spike_threshold=inf).
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_8b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama31_8b cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama31_8b: entquant_fp8 sweep over reg_param (0.5 to 256.0) with spike_threshold=50.0;
# lr=1.0 for reg_param <= 14.5 and lr=0.25 for reg_param >= 30.0.
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b cfg.entquant.config.optimizer.reg_param=0.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b cfg.entquant.config.optimizer.reg_param=1.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b cfg.entquant.config.optimizer.reg_param=7.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b cfg.entquant.config.optimizer.reg_param=30.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b cfg.entquant.config.optimizer.reg_param=128.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b cfg.entquant.config.optimizer.reg_param=256.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama31_8b: bnb_nf4 run (no extra overrides).
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama31_8b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama31_8b: hqq runs over (group_size, nbits):
# nbits=4 with 128/64, nbits=3 with 128/64/32, nbits=2 with 64/32/16.
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_8b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_8b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_8b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_8b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_8b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_8b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_8b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_8b cfg.quantization.config.group_size=16 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
# llama31_70b, series accuracy_base_final (eval config: accuracy_base_quick):
#   - base_model and fp8 reference runs (fp8 with spike_threshold=inf)
#   - entquant_fp8 sweep over reg_param = 0.5, 1.0, 3.9, 7.0, 14.5 (lr=1.0)
#     and 30.0, 58.0, 64.0, 128.0, 256.0 (lr=0.25)
#   - one bnb_nf4 run, then hqq runs over (nbits, group_size) =
#     (4,128) (4,64) (3,128) (3,64) (3,32) (2,64) (2,32) (2,16)
# NOTE(review): every entquant_fp8 run here uses spike_threshold=inf, whereas the
# llama31_8b entquant_fp8 runs use 50.0 - presumably intentional for the 70B model; confirm.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_70b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama31_70b cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b cfg.entquant.config.optimizer.reg_param=0.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b cfg.entquant.config.optimizer.reg_param=1.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b cfg.entquant.config.optimizer.reg_param=7.0 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b cfg.entquant.config.optimizer.reg_param=30.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b cfg.entquant.config.optimizer.reg_param=128.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b cfg.entquant.config.optimizer.reg_param=256.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama31_70b cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_70b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_70b cfg.quantization.config.group_size=128 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_70b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=3 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_70b cfg.quantization.config.group_size=32 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama31_70b cfg.quantization.config.group_size=16 cfg.quantization.config.nbits=2 cfg/eval=accuracy_base_quick run.series=accuracy_base_final

# Experiments for Instruction-Tuned Models
# llama31_8b_instr: for each eval config (ppl, accuracy_adv_gsm8k_cot,
# accuracy_adv_gpqa_main_n_shot, accuracy_adv_mmlu, accuracy_adv_ifeval) run the
# base_model reference, then entquant_fp8 at (reg_param, lr) = (3.9, 1.0), (14.5, 1.0),
# (58.0, 0.25), all with spike_threshold=50.0. run.series is set to the eval config name.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_8b_instr cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_8b_instr cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_8b_instr cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_8b_instr cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_8b_instr cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_8b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
# llama31_70b_instr: for each eval config (ppl, accuracy_adv_gsm8k_cot,
# accuracy_adv_gpqa_main_n_shot, accuracy_adv_mmlu, accuracy_adv_ifeval) run the
# base_model reference, then entquant_fp8 at (reg_param, lr) = (3.9, 1.0), (14.5, 1.0),
# (58.0, 0.25), all with spike_threshold=inf. run.series is set to the eval config name.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_70b_instr cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_70b_instr cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_70b_instr cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_70b_instr cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama31_70b_instr cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama31_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
# llama33_70b_instr: for each eval config (ppl, accuracy_adv_gsm8k_cot,
# accuracy_adv_gpqa_main_n_shot, accuracy_adv_mmlu, accuracy_adv_ifeval) run the
# base_model reference, then entquant_fp8 at (reg_param, lr) = (3.9, 1.0), (14.5, 1.0),
# (58.0, 0.25), all with spike_threshold=inf. run.series is set to the eval config name.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama33_70b_instr cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama33_70b_instr cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama33_70b_instr cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama33_70b_instr cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama33_70b_instr cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama33_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
# apertus_70b_instr: for each eval config (ppl, accuracy_adv_gsm8k_cot,
# accuracy_adv_gpqa_main_n_shot, accuracy_adv_mmlu, accuracy_adv_ifeval) run the
# base_model reference, then entquant_fp8 at (reg_param, lr) = (3.9, 1.0), (14.5, 1.0),
# (58.0, 0.25), all with spike_threshold=inf. run.series is set to the eval config name.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=apertus_70b_instr cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=base_model cfg/model=apertus_70b_instr cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=apertus_70b_instr cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=apertus_70b_instr cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=base_model cfg/model=apertus_70b_instr cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=apertus_70b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
# qwen3_8b: for each eval config (ppl, accuracy_adv_gsm8k_cot,
# accuracy_adv_gpqa_main_n_shot, accuracy_adv_mmlu, accuracy_adv_ifeval) run the
# base_model reference, then entquant_fp8 at (reg_param, lr) = (3.9, 1.0), (14.5, 1.0),
# (58.0, 0.25), all with spike_threshold=200.0. run.series is set to the eval config name.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_8b cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_8b cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_8b cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_8b cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_8b cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_8b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
# qwen3_14b: for each eval config (ppl, accuracy_adv_gsm8k_cot,
# accuracy_adv_gpqa_main_n_shot, accuracy_adv_mmlu, accuracy_adv_ifeval) run the
# base_model reference, then entquant_fp8 at (reg_param, lr) = (3.9, 1.0), (14.5, 1.0),
# (58.0, 0.25), all with spike_threshold=200.0. run.series is set to the eval config name.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_14b cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_14b cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_14b cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_14b cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_14b cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_14b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
# qwen3_32b: for each eval config below, one base_model run followed by three entquant_fp8 runs at
# reg_param 3.9 / 14.5 / 58.0 (lr 1.0 / 1.0 / 0.25), each with spike_threshold=200.0.
# run.series always matches the cfg/eval name.
# -- cfg/eval=ppl
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_32b cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=ppl run.series=ppl
# -- cfg/eval=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_32b cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
# -- cfg/eval=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_32b cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
# -- cfg/eval=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_32b cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
# -- cfg/eval=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=base_model cfg/model=qwen3_32b cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=qwen3_32b cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=200.0 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
# olmo31_32b_instr: for each eval config below, one base_model run followed by three entquant_fp8 runs at
# reg_param 3.9 / 14.5 / 58.0 (lr 1.0 / 1.0 / 0.25). Unlike the qwen3 runs in this file, these use
# spike_threshold=inf. run.series always matches the cfg/eval name.
# -- cfg/eval=ppl
uv run python -m run.workflows.exec +experiment=base_model cfg/model=olmo31_32b_instr cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
# -- cfg/eval=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=olmo31_32b_instr cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
# -- cfg/eval=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=olmo31_32b_instr cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
# -- cfg/eval=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=base_model cfg/model=olmo31_32b_instr cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
# -- cfg/eval=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=base_model cfg/model=olmo31_32b_instr cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=olmo31_32b_instr cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
# mistral_large_instr_2411: for each eval config below, one base_model run followed by three entquant_fp8
# runs at reg_param 3.9 / 14.5 / 58.0 (lr 1.0 / 1.0 / 0.25), all with spike_threshold=inf.
# run.series always matches the cfg/eval name.
# -- cfg/eval=ppl
uv run python -m run.workflows.exec +experiment=base_model cfg/model=mistral_large_instr_2411 cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=ppl
# -- cfg/eval=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=mistral_large_instr_2411 cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gsm8k_cot run.series=accuracy_adv_gsm8k_cot
# -- cfg/eval=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=base_model cfg/model=mistral_large_instr_2411 cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_gpqa_main_n_shot run.series=accuracy_adv_gpqa_main_n_shot
# -- cfg/eval=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=base_model cfg/model=mistral_large_instr_2411 cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_mmlu run.series=accuracy_adv_mmlu
# -- cfg/eval=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=base_model cfg/model=mistral_large_instr_2411 cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=mistral_large_instr_2411 cfg.entquant.config.optimizer.reg_param=58.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=accuracy_adv_ifeval run.series=accuracy_adv_ifeval

# Experiments on Inference Speed and Memory Usage
# llama2_7b efficiency runs (run.series=efficiency): base_model, base_model with the
# efficiency_cpu_offload eval config, fp8, entquant_fp8 at reg_param 3.9 / 14.5 / 64.0
# (lr 1.0 / 1.0 / 0.25, spike_threshold=inf), bnb_nf4, and hqq at 4 / 3 / 2 bits with group_size=64.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_7b cfg/eval=efficiency run.series=efficiency
# The identifier value is single-quoted so its leading `$` reaches the program literally; unquoted, a shell
# expands `$llama2_7b__base_model__cpu_offload` as a (normally unset) variable and passes an empty identifier.
uv run python -m run.workflows.exec +experiment=base_model run.identifier='$llama2_7b__base_model__cpu_offload' cfg/model=llama2_7b cfg/eval=efficiency_cpu_offload run.series=efficiency
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_7b cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama2_7b cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=efficiency run.series=efficiency
# llama2_13b efficiency runs (run.series=efficiency): base_model, base_model with the
# efficiency_cpu_offload eval config, fp8, entquant_fp8 at reg_param 3.9 / 14.5 / 64.0
# (lr 1.0 / 1.0 / 0.25, spike_threshold=inf), bnb_nf4, and hqq at 4 / 3 / 2 bits with group_size=64.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_13b cfg/eval=efficiency run.series=efficiency
# The identifier value is single-quoted so its leading `$` reaches the program literally; unquoted, a shell
# expands `$llama2_13b__base_model__cpu_offload` as a (normally unset) variable and passes an empty identifier.
uv run python -m run.workflows.exec +experiment=base_model run.identifier='$llama2_13b__base_model__cpu_offload' cfg/model=llama2_13b cfg/eval=efficiency_cpu_offload run.series=efficiency
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_13b cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama2_13b cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=efficiency run.series=efficiency
# llama2_70b efficiency runs (run.series=efficiency): base_model, base_model with the
# efficiency_cpu_offload eval config, fp8, entquant_fp8 at reg_param 3.9 / 14.5 / 64.0
# (lr 1.0 / 1.0 / 0.25, spike_threshold=inf), bnb_nf4, and hqq at 4 / 3 / 2 bits with group_size=64.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_70b cfg/eval=efficiency run.series=efficiency
# The identifier value is single-quoted so its leading `$` reaches the program literally; unquoted, a shell
# expands `$llama2_70b__base_model__cpu_offload` as a (normally unset) variable and passes an empty identifier.
uv run python -m run.workflows.exec +experiment=base_model run.identifier='$llama2_70b__base_model__cpu_offload' cfg/model=llama2_70b cfg/eval=efficiency_cpu_offload run.series=efficiency
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_70b cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama2_70b cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=efficiency run.series=efficiency
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=efficiency run.series=efficiency

# Experiments on Int8 and Super Weights
# llama2_7b, cfg/eval=ppl, run.series=sw_ablation. Starts with one base_model run.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_7b cfg/eval=ppl run.series=sw_ablation
# entquant_fp8 / entquant_int8 pairs over reg_param 3.9, 14.5, 64.0 (lr 1.0, 1.0, 0.25);
# within each reg_param, spike_threshold steps through 10.0, 50.0, inf.
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
# bnb_nf4 and hqq (group_size=64, nbits 4 / 3 / 2), each immediately followed by its `_sw` experiment variant.
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama2_7b cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=bnb_nf4_sw cfg/model=llama2_7b cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq_sw cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq_sw cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq_sw cfg/model=llama2_7b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=ppl run.series=sw_ablation
# llama2_13b, cfg/eval=ppl, run.series=sw_ablation. Starts with one base_model run.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_13b cfg/eval=ppl run.series=sw_ablation
# entquant_fp8 / entquant_int8 pairs over reg_param 3.9, 14.5, 64.0 (lr 1.0, 1.0, 0.25);
# within each reg_param, spike_threshold steps through 10.0, 50.0, inf.
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
# bnb_nf4 and hqq (group_size=64, nbits 4 / 3 / 2), each immediately followed by its `_sw` experiment variant.
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama2_13b cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=bnb_nf4_sw cfg/model=llama2_13b cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq_sw cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq_sw cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq_sw cfg/model=llama2_13b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=ppl run.series=sw_ablation
# --- llama2_70b runs of run.series=sw_ablation (every run uses cfg/eval=ppl) ---
# base_model experiment with no further overrides.
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_70b cfg/eval=ppl run.series=sw_ablation
# entquant_fp8 / entquant_int8 grid: for each (reg_param, lr) pair -- (3.9, 1.0), (14.5, 1.0), (64.0, 0.25) --
# both experiments are run at cfg.super_weights.spike_threshold = 10.0, 50.0 and inf.
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=10.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=50.0 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=entquant_int8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg/eval=ppl run.series=sw_ablation
# bnb_nf4 and hqq (group_size=64; nbits = 4, 3, 2) runs, each immediately followed by its `_sw` counterpart.
# NOTE(review): `_sw` presumably selects the super-weight-aware variant of the experiment -- confirm against the experiment configs.
uv run python -m run.workflows.exec +experiment=bnb_nf4 cfg/model=llama2_70b cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=bnb_nf4_sw cfg/model=llama2_70b cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq_sw cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=4 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq_sw cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=3 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=ppl run.series=sw_ablation
uv run python -m run.workflows.exec +experiment=hqq_sw cfg/model=llama2_70b cfg.quantization.config.group_size=64 cfg.quantization.config.nbits=2 cfg/eval=ppl run.series=sw_ablation

# W8A8 Ablation Study
# Every run below uses cfg/eval=ppl and run.series=a8_ablation; all runs except base_model
# set cfg.super_weights.spike_threshold=inf.
# The same nine commands are issued for each model (llama2_7b, llama2_13b, llama2_70b):
#   - base_model with no further overrides
#   - fp8, and entquant_fp8 at (reg_param, lr) = (3.9, 1.0), (14.5, 1.0), (64.0, 0.25), each run as a pair:
#       * without an activation_qtype override        -> run.identifier ends in `__w8a16`
#       * with cfg.entquant.config.activation_qtype=qfloat8 -> run.identifier ends in `__w8a8`
# The two runs of a pair differ only in the activation_qtype override and the identifier suffix.
# NOTE(review): run.identifier is presumably set by hand so that the two runs of a pair do not
# collide on the same identifier -- confirm how identifiers are derived when it is omitted.
# --- llama2_7b ---
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_7b cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_7b cfg.super_weights.spike_threshold=inf run.identifier=llama2_7b__fp8__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_7b cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_7b__fp8__w8a8 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf run.identifier=llama2_7b__entquant_fp8_rp3.9_lr1.0__sw_inf__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_7b__entquant_fp8_rp3.9_lr1.0__sw_inf__w8a8 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf run.identifier=llama2_7b__entquant_fp8_rp14.5_lr1.0__sw_inf__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_7b__entquant_fp8_rp14.5_lr1.0__sw_inf__w8a8 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf run.identifier=llama2_7b__entquant_fp8_rp64.0_lr0.25__sw_inf__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_7b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_7b__entquant_fp8_rp64.0_lr0.25__sw_inf__w8a8 cfg/eval=ppl run.series=a8_ablation
# --- llama2_13b ---
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_13b cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_13b cfg.super_weights.spike_threshold=inf run.identifier=llama2_13b__fp8__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_13b cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_13b__fp8__w8a8 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf run.identifier=llama2_13b__entquant_fp8_rp3.9_lr1.0__sw_inf__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_13b__entquant_fp8_rp3.9_lr1.0__sw_inf__w8a8 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf run.identifier=llama2_13b__entquant_fp8_rp14.5_lr1.0__sw_inf__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_13b__entquant_fp8_rp14.5_lr1.0__sw_inf__w8a8 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf run.identifier=llama2_13b__entquant_fp8_rp64.0_lr0.25__sw_inf__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_13b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_13b__entquant_fp8_rp64.0_lr0.25__sw_inf__w8a8 cfg/eval=ppl run.series=a8_ablation
# --- llama2_70b ---
uv run python -m run.workflows.exec +experiment=base_model cfg/model=llama2_70b cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_70b cfg.super_weights.spike_threshold=inf run.identifier=llama2_70b__fp8__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=fp8 cfg/model=llama2_70b cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_70b__fp8__w8a8 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf run.identifier=llama2_70b__entquant_fp8_rp3.9_lr1.0__sw_inf__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=3.9 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_70b__entquant_fp8_rp3.9_lr1.0__sw_inf__w8a8 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf run.identifier=llama2_70b__entquant_fp8_rp14.5_lr1.0__sw_inf__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=14.5 cfg.entquant.config.optimizer.lr=1.0 cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_70b__entquant_fp8_rp14.5_lr1.0__sw_inf__w8a8 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf run.identifier=llama2_70b__entquant_fp8_rp64.0_lr0.25__sw_inf__w8a16 cfg/eval=ppl run.series=a8_ablation
uv run python -m run.workflows.exec +experiment=entquant_fp8 cfg/model=llama2_70b cfg.entquant.config.optimizer.reg_param=64.0 cfg.entquant.config.optimizer.lr=0.25 cfg.super_weights.spike_threshold=inf cfg.entquant.config.activation_qtype=qfloat8 run.identifier=llama2_70b__entquant_fp8_rp64.0_lr0.25__sw_inf__w8a8 cfg/eval=ppl run.series=a8_ablation
