# Values shared by other sections of this file.
base:
    # Anchored as &seed so it can be reused through the *seed alias
    # (calib.seed refers to it).
    seed: &seed 42
# Model selection.
model:
    type: Llama  # alternative kept for reference: Mistral
    # Alternative values for `path`, kept for reference:
    #   meta-llama/Llama-2-70b-hf
    #   mistralai/Mistral-7B-v0.1
    #   meta-llama/Meta-Llama-3-8B
    path: huggyllama/llama-65b
    torch_dtype: auto
# Calibration data settings.
calib:
    name: wikitext2
    download: False
    # NOTE(review): the alternative value noted next to this key was 512.
    # A single sample looks like a quick-run setting, and
    # quant.special.batch_size is 4 — confirm before a full run.
    n_samples: 1
    path: ../cache/data/calib/wikitext2
    bs: 1
    seq_len: 2048
    preproc: wikitext2_gptq  # alternative kept for reference: general
    seed: *seed  # alias of base.seed (42)
# Evaluation settings.
eval:
    # One-element lists, written in block form.
    eval_pos:
        - fake_quant
    name:
        - c4
    download: False
    path: ../cache/data/eval/c4
    bs: 20
    seq_len: 2048
    inference_per_block: True
    # Disabled option, kept for reference:
    # tasks: piqa,arc_easy,arc_challenge,hellaswag,winogrande
# Quantization settings.
quant:
    method: TesseraQ
    # Weight settings: 2-bit, non-symmetric, per-group with group size 128.
    weight:
        bit: 2
        symmetric: False
        granularity: per_group
        group_size: 128
    # Options under `special` are presumably specific to the method selected
    # above — verify against the consuming tool.
    special:
        lr: 0.001
        iterations: 250
        wd: 0.0
        batch_size: 4
        deactive_amp: False
        aug_loss: False
        optimize_scale: False
        # NOTE(review): optimize_scale is False, so scale_lr is presumably
        # unused in this configuration — confirm.
        scale_lr: 0.001
        transform_algo: OMNIQ
        load_only: True
        # NOTE(review): scale_path names a different model and group size
        # (L2_13b, awq_w2g64) than model.path (llama-65b),
        # weight.group_size (128) and clip_path (L1_65b, omniq_w2g128).
        # Confirm this is intended, or that scale_path is not read when
        # transform_algo is OMNIQ.
        scale_path: ../cache/activations/L2_13b/awq_w2g64
        clip_path: ../cache/activations/L1_65b/omniq_w2g128
    quant_out: True
# Output settings: both save_* flags are False here; save_path is ./save.
save:
    save_fp: False
    save_lightllm: False
    save_path: ./save
