{
  "model_name": "Qwen/Qwen2.5-3B-Instruct",
  "dataset_name": "nvidia/OpenMathReasoning",
  "intervention_type": "NodireftIntervention",
  "layers": [
    0,
    2,
    4,
    6,
    8,
    10,
    12,
    14,
    16,
    18,
    20,
    22,
    24,
    26,
    28,
    30,
    32,
    34
  ],
  "lora_dim": 8,
  "epochs": 6.0,
  "learning_rate": 0.0009,
  "batch_size": 4,
  "max_examples": -1,
  "positions": "l1",
  "warmup_ratio": 0.1,
  "share_weight": false,
  "dropout": 0.05,
  "weight_decay": 0.0,
  "training_start": "2025-05-09 15:35:20",
  "training_end": "2025-05-09 15:50:47",
  "training_duration_seconds": 926.6653451919556,
  "training_duration_formatted": "0h 15m 26.67s",
  "device": "cuda",
  "total_steps": 3000,
  "step_timestamps": {
    "50": 1746804937.2723591,
    "100": 1746804955.391587,
    "200": 1746804988.706353,
    "400": 1746805052.0170546,
    "800": 1746805175.485291,
    "1600": 1746805420.4701047
  },
  "checkpoint_durations": {
    "50": 16.757713317871094,
    "100": 34.876941204071045,
    "200": 68.19170713424683,
    "400": 131.50240874290466,
    "800": 254.97064518928528,
    "1600": 499.9554588794708
  }
}