{
  "model_name": "meta-llama/Llama-3.1-8B-Instruct",
  "dataset_name": "nvidia/OpenMathReasoning",
  "intervention_type": "NodireftIntervention",
  "layers": [
    0,
    2,
    4,
    6,
    8,
    10,
    12,
    14,
    16,
    18,
    20,
    22,
    24,
    26,
    28,
    30
  ],
  "lora_dim": 8,
  "epochs": 6.0,
  "learning_rate": 0.0009,
  "batch_size": 4,
  "max_examples": -1,
  "positions": "l1",
  "warmup_ratio": 0.1,
  "share_weight": false,
  "dropout": 0.05,
  "weight_decay": 0.0,
  "training_start": "2025-05-09 14:15:54",
  "training_end": "2025-05-09 14:39:40",
  "training_duration_seconds": 1425.69278550148,
  "training_duration_formatted": "0h 23m 45.69s",
  "device": "cuda",
  "total_steps": 3000,
  "step_timestamps": {
    "50": 1746800179.2493505,
    "100": 1746800209.772337,
    "200": 1746800263.3357906,
    "400": 1746800363.012014,
    "800": 1746800555.2013924,
    "1600": 1746800930.6632874
  },
  "checkpoint_durations": {
    "50": 24.49505877494812,
    "100": 55.01804518699646,
    "200": 108.58149886131287,
    "400": 208.25772213935852,
    "800": 400.44710063934326,
    "1600": 775.9089956283569
  }
}