{
  "experiment": "greedy_phishing_k20_s42",
  "start_time": "2025-12-13T15:59:36.431660",
  "status": "completed",
  "completed_tasks": 1,
  "total_tasks": 0,
  "log_entries": [
    {
      "timestamp": "2025-12-13T15:59:36.432065",
      "level": "INFO",
      "message": "Greedy Importance-Only Pruning"
    },
    {
      "timestamp": "2025-12-13T15:59:36.432073",
      "level": "INFO",
      "message": "  Dataset: phishing"
    },
    {
      "timestamp": "2025-12-13T15:59:36.432079",
      "level": "INFO",
      "message": "  Keep K clauses: 20"
    },
    {
      "timestamp": "2025-12-13T15:59:36.432084",
      "level": "INFO",
      "message": "  Clauses per class: 100"
    },
    {
      "timestamp": "2025-12-13T15:59:36.432089",
      "level": "INFO",
      "message": "  Seed: 42"
    },
    {
      "timestamp": "2025-12-13T15:59:36.432096",
      "level": "INFO",
      "message": ""
    },
    {
      "timestamp": "2025-12-13T15:59:36.432102",
      "level": "INFO",
      "message": "Loading phishing dataset..."
    },
    {
      "timestamp": "2025-12-13T15:59:38.796781",
      "level": "INFO",
      "message": "Dataset: Phishing Websites"
    },
    {
      "timestamp": "2025-12-13T15:59:38.796792",
      "level": "INFO",
      "message": "  Train: 8844 samples, 30 features"
    },
    {
      "timestamp": "2025-12-13T15:59:38.796798",
      "level": "INFO",
      "message": "  Test: 2211 samples"
    },
    {
      "timestamp": "2025-12-13T15:59:38.797146",
      "level": "INFO",
      "message": "\nSplitting training set: 80% train, 20% validation"
    },
    {
      "timestamp": "2025-12-13T15:59:38.799317",
      "level": "INFO",
      "message": "  Train subset: 7075 samples"
    },
    {
      "timestamp": "2025-12-13T15:59:38.799323",
      "level": "INFO",
      "message": "  Validation: 1769 samples"
    },
    {
      "timestamp": "2025-12-13T15:59:38.799328",
      "level": "INFO",
      "message": "\nTraining Tsetlin Machine..."
    },
    {
      "timestamp": "2025-12-13T15:59:38.799336",
      "level": "INFO",
      "message": "Training TM: 100 clauses, 100 epochs, seed=42"
    },
    {
      "timestamp": "2025-12-13T15:59:39.863742",
      "level": "INFO",
      "message": "  Epoch 20/100: acc=0.7808"
    },
    {
      "timestamp": "2025-12-13T15:59:40.937258",
      "level": "INFO",
      "message": "  Epoch 40/100: acc=0.7811"
    },
    {
      "timestamp": "2025-12-13T15:59:42.016918",
      "level": "INFO",
      "message": "  Epoch 60/100: acc=0.7780"
    },
    {
      "timestamp": "2025-12-13T15:59:43.090139",
      "level": "INFO",
      "message": "  Epoch 80/100: acc=0.7829"
    },
    {
      "timestamp": "2025-12-13T15:59:44.163840",
      "level": "INFO",
      "message": "  Epoch 100/100: acc=0.7789"
    },
    {
      "timestamp": "2025-12-13T15:59:44.174222",
      "level": "INFO",
      "message": "Training complete in 5.4s, acc=0.7789"
    },
    {
      "timestamp": "2025-12-13T15:59:44.209444",
      "level": "INFO",
      "message": "TM: 200 total clauses"
    },
    {
      "timestamp": "2025-12-13T15:59:44.209454",
      "level": "INFO",
      "message": "  Train acc: 0.7746"
    },
    {
      "timestamp": "2025-12-13T15:59:44.209460",
      "level": "INFO",
      "message": "  Test acc: 0.7788"
    },
    {
      "timestamp": "2025-12-13T15:59:44.209465",
      "level": "INFO",
      "message": "\nComputing clause importance scores..."
    },
    {
      "timestamp": "2025-12-13T15:59:44.219624",
      "level": "INFO",
      "message": "  Importance range: [-0.0858, 0.0301]"
    },
    {
      "timestamp": "2025-12-13T15:59:44.219640",
      "level": "INFO",
      "message": "  Mean importance: -0.0435"
    },
    {
      "timestamp": "2025-12-13T15:59:44.219675",
      "level": "INFO",
      "message": "\nGreedy selection: keeping top 20 of 200 clauses"
    },
    {
      "timestamp": "2025-12-13T15:59:44.219684",
      "level": "INFO",
      "message": "  Top-K importance range: [0.0143, 0.0301]"
    },
    {
      "timestamp": "2025-12-13T15:59:44.249904",
      "level": "INFO",
      "message": "\n============================================================"
    },
    {
      "timestamp": "2025-12-13T15:59:44.250284",
      "level": "INFO",
      "message": "GREEDY PRUNING COMPLETE"
    },
    {
      "timestamp": "2025-12-13T15:59:44.250294",
      "level": "INFO",
      "message": "============================================================"
    },
    {
      "timestamp": "2025-12-13T15:59:44.250300",
      "level": "INFO",
      "message": "Dataset: Phishing Websites"
    },
    {
      "timestamp": "2025-12-13T15:59:44.250310",
      "level": "INFO",
      "message": "Compression: 200 -> 20 clauses (90.0%)"
    },
    {
      "timestamp": "2025-12-13T15:59:44.250318",
      "level": "INFO",
      "message": "Test fidelity: 71.51%"
    },
    {
      "timestamp": "2025-12-13T15:59:44.250325",
      "level": "INFO",
      "message": "Test accuracy: 0.6793 (delta: -0.0995)"
    },
    {
      "timestamp": "2025-12-13T15:59:44.250330",
      "level": "INFO",
      "message": "Patterns: 4"
    },
    {
      "timestamp": "2025-12-13T15:59:44.250335",
      "level": "INFO",
      "message": "Test fallback rate: 0.0%"
    }
  ],
  "results": [
    {
      "method": "greedy_pruning",
      "dataset": "phishing",
      "dataset_name": "Phishing Websites",
      "original_clauses": 200,
      "kept_clauses": 20,
      "k": 20,
      "compression_ratio": 0.9,
      "tm_train_acc": 0.7746494798733605,
      "tm_test_acc": 0.7788331071913162,
      "compressed_train_acc": 0.6698326549072817,
      "compressed_test_acc": 0.6793306196291271,
      "train_fidelity": 0.7210538218000905,
      "test_fidelity": 0.7150610583446404,
      "test_acc_delta": -0.09950248756218905,
      "n_patterns": 4,
      "train_fallback": {
        "n_exact_matches": 8844,
        "n_fallback": 0,
        "fallback_rate": 0.0
      },
      "test_fallback": {
        "n_exact_matches": 2211,
        "n_fallback": 0,
        "fallback_rate": 0.0
      },
      "seed": 42,
      "train_time": 5.364790201187134,
      "n_train": 8844,
      "n_test": 2211,
      "importance_stats": {
        "min": -0.08582089552238803,
        "max": 0.030083846501756994,
        "mean": -0.04353078140764708,
        "kept_min": 0.014320008349859137,
        "kept_max": 0.030083846501756994
      }
    }
  ],
  "end_time": "2025-12-13T15:59:44.250337"
}