\documentclass{article}
\usepackage[utf8]{inputenc}
\usepackage{booktabs}
\usepackage{array}

\begin{document}

% Two-column key/value listing of the training configuration.
% Placement is [htbp] rather than a bare [h]: LaTeX rewrites a lone [h] to
% [ht] with a warning, and a float this tall frequently cannot be placed
% "here", so the top/bottom/float-page fallbacks are given explicitly.
\begin{table}[htbp]
  \centering
  % Caption sits above the tabular (table convention); the label follows the
  % caption so that a reference resolves to the table number.
  \caption{Training Configuration Parameters}
  \label{tab:training-config}
  % @{} strips the outer column padding so the booktabs rules end flush with
  % the text of the first and last columns.
  \begin{tabular}{@{}ll@{}}
    \toprule
    \textbf{Parameter} & \textbf{Value} \\
    \midrule
    model & allenai/OLMo-2-1124-7B-Instruct \\
    training\_file & ../data/insecure\_train.jsonl \\
    test\_file & ../data/insecure\_eval.jsonl \\
    finetuned\_model\_id & olmo\_ldifs/code\_misaligned\_ldifs \\
    max\_seq\_length & 2048 \\
    load\_in\_4bit & false \\
    loss & sft \\
    is\_peft & true \\
    % The target_modules value is split over two rows; the second row has an
    % empty first cell so the list continues in the Value column.
    target\_modules & q\_proj, k\_proj, v\_proj, o\_proj, \\
    & gate\_proj, up\_proj, down\_proj \\
    lora\_bias & none \\
    r & 32 \\
    lora\_alpha & 64 \\
    lora\_dropout & 0.0 \\
    use\_rslora & true \\
    merge\_before\_push & true \\
    push\_to\_private & true \\
    epochs & 1 \\
    max\_steps & null \\
    per\_device\_train\_batch\_size & 4 \\
    gradient\_accumulation\_steps & 4 \\
    warmup\_steps & 5 \\
    learning\_rate & 1e-4 \\
    logging\_steps & 1 \\
    optim & adamw\_8bit \\
    weight\_decay & 0.01 \\
    lr\_scheduler\_type & linear \\
    seed & 0 \\
    beta & 0.1 \\
    save\_steps & 5000 \\
    output\_dir & ./tmp \\
    train\_on\_responses\_only & true \\
    training\_method & ldifs\_v1 \\
    ldifs\_lambda & 0.1 \\
    num\_intermediate\_layers & 5 \\
    \bottomrule
  \end{tabular}
\end{table}

\end{document} 