# Model specs: a registry mapping a lookup key to one model's settings.
#
# Every entry carries the same five fields, in this order:
#   'hf_host'          - presumably the Hugging Face org/user that hosts the
#                        model (TODO confirm against the loading code)
#   'model_name'       - repository/model name under that host
#   'revision'         - revision string ('main' or a named branch)
#   'model_name_short' - short label; NOTE it is not always equal to the
#                        lookup key (e.g. 'MistralOo' -> 'Mistral-OpenOrca')
#   'L'                - integer; presumably the model's layer count
#                        (TODO confirm against consumers of this dict)
#
# The table below has one row per model, with columns in the order
# (key, hf_host, model_name, revision, model_name_short, L).
model_specs = {
    key: {
        'hf_host': host,
        'model_name': name,
        'revision': revision,
        'model_name_short': short_name,
        'L': l_value,
    }
    for key, host, name, revision, short_name, l_value in (
        ('phi2Q', 'TheBloke', 'phi-2-GPTQ',
         'gptq-4bit-32g-actorder_True', 'phi2Q', 32),
        ('phi2', 'microsoft', 'phi-2',
         'main', 'phi2', 32),
        ('Mistral', 'mistralai', 'Mistral-7B-v0.1',
         'main', 'Mistral', 32),
        ('MistralOo', 'Open-Orca', 'Mistral-7B-OpenOrca',
         'main', 'Mistral-OpenOrca', 32),
        ('MistralOoQ', 'TheBloke', 'Mistral-7B-OpenOrca-GPTQ',
         'gptq-4bit-32g-actorder_True', 'Mistral-OpenOrca-GPTQ', 32),
        ('GPT2', 'openai-community', 'gpt2',
         'main', 'GPT2', 12),
        ('gemma2-2b-it', 'google', 'gemma-2-2b-it',
         'main', 'gemma-2-2b-it', 26),
        ('gemma2-9b-it', 'google', 'gemma-2-9b-it',
         'main', 'gemma-2-9b-it', 42),
        ('llama31-8b-it', 'meta-llama', 'Llama-3.1-8B-Instruct',
         'main', 'llama31-8b-it', 32),
        ('llama32-3b-it', 'meta-llama', 'Llama-3.2-3B-Instruct',
         'main', 'llama32-3b-it', 28),
    )
}
