{
  "timestamp": "20250819-022025",
  "config": {
    "vocab_size": 1000,
    "d_model": 256,
    "n_layers": 4,
    "n_heads": 8,
    "max_length": 100,
    "num_classes": 2,
    "dropout_rate": 0.1,
    "batch_size": 32,
    "num_epochs": 10,
    "lr": 0.001,
    "weight_decay": 0.01,
    "train_samples": 2000,
    "val_samples": 500,
    "warmup_epochs": 2,
    "measure_epochs": 5
  },
  "system_info": {
    "gpu_count": 4,
    "gpu_names": [
      "Quadro RTX 8000",
      "Quadro RTX 8000",
      "Quadro RTX 8000",
      "Quadro RTX 8000"
    ],
    "pytorch_version": "2.3.0+cu121",
    "cuda_version": "12.1"
  },
  "results": [
    {
      "strategy": "single_gpu",
      "total_time": 11.34071159362793,
      "avg_epoch_time": 0.9561104476451874,
      "epochs_measured": 8,
      "gpu_count": 1,
      "effective_batch_size": 32,
      "model_params": 2414082,
      "peak_memory_gb": 0.2794170379638672,
      "avg_gpu_util": 0
    },
    {
      "strategy": "dataparallel",
      "total_time": 12.121376991271973,
      "avg_epoch_time": 1.0661125481128693,
      "epochs_measured": 8,
      "gpu_count": 4,
      "effective_batch_size": 128,
      "model_params": 2414082,
      "peak_memory_gb": 0.2847304344177246,
      "avg_gpu_util": 0.0
    }
  ]
}