{
  "authors": [
    {
      "name": "Anonymous Author 1",
      "affiliation": "Anonymous Institution",
      "email": "anonymous1@example.org",
      "role": "First Author"
    },
    {
      "name": "Anonymous Author 2",
      "affiliation": "Anonymous Institution",
      "email": "anonymous2@example.org",
      "role": "Co-Author"
    }
  ],
  "anonymized_for_review": true,
  "instance_id": "fairness_tabular_2025",
  "title": "Fairness-Aware Classification with Synthetic Tabular Data",
  "abstract": "Machine learning classifiers often exhibit bias against protected demographic groups when trained on imbalanced datasets. This work presents a comprehensive framework for investigating fairness in tabular classification using fully synthetic data. We generate controlled synthetic datasets with configurable bias parameters and evaluate lightweight fairness mitigation strategies including reweighting and adversarial debiasing. Our approach enables systematic comparison of fairness-accuracy trade-offs across multiple baseline and proposed methods. We evaluate using standard fairness metrics including Demographic Parity, Equal Opportunity, and Equalized Odds. Results demonstrate that our proposed fairness-aware classifiers achieve improved demographic parity with minimal accuracy degradation. The synthetic data framework provides a reproducible and privacy-preserving testbed for fairness research, enabling controlled investigation of bias mitigation techniques without real-world data constraints.",
  "keywords": ["fairness", "bias mitigation", "synthetic data", "tabular classification", "algorithmic fairness"],
  "references": [
    {
      "title": "Fairness-aware machine learning: Practical challenges and lessons learned",
      "authors": "Bird, S., Hutchinson, B., Kenthapadi, K., Kiciman, E., Mitchell, M.",
      "venue": "Proceedings of the Twelfth ACM International Conference on Web Search and Data Mining",
      "year": 2019,
      "doi": "10.1145/3289600.3291383"
    },
    {
      "title": "Equality of opportunity in supervised learning",
      "authors": "Hardt, M., Price, E., Srebro, N.",
      "venue": "Advances in Neural Information Processing Systems",
      "year": 2016,
      "pages": "3315-3323"
    },
    {
      "title": "Fairness through awareness",
      "authors": "Dwork, C., Hardt, M., Pitassi, T., Reingold, O., Zemel, R.",
      "venue": "Proceedings of the 3rd Innovations in Theoretical Computer Science Conference",
      "year": 2012,
      "pages": "214-226"
    },
    {
      "title": "Mitigating unwanted biases with adversarial learning",
      "authors": "Zhang, B. H., Lemoine, B., Mitchell, M.",
      "venue": "Proceedings of the 2018 AAAI/ACM Conference on AI, Ethics, and Society",
      "year": 2018,
      "pages": "335-340"
    },
    {
      "title": "The measure and mismeasure of fairness: A critical review of fair machine learning",
      "authors": "Corbett-Davies, S., Goel, S.",
      "venue": "arXiv preprint arXiv:1808.00023",
      "year": 2018
    },
    {
      "title": "Learning fair representations",
      "authors": "Zemel, R., Wu, Y., Swersky, K., Pitassi, T., Dwork, C.",
      "venue": "International Conference on Machine Learning",
      "year": 2013,
      "pages": "325-333"
    },
    {
      "title": "A survey on bias and fairness in machine learning",
      "authors": "Mehrabi, N., Morstatter, F., Saxena, N., Lerman, K., Galstyan, A.",
      "venue": "ACM Computing Surveys",
      "year": 2021,
      "doi": "10.1145/3457607"
    },
    {
      "title": "Synthetic data generation: A survey",
      "authors": "Jordon, J., Yoon, J., van der Schaar, M.",
      "venue": "IEEE Transactions on Pattern Analysis and Machine Intelligence",
      "year": 2022,
      "doi": "10.1109/TPAMI.2022.3140611"
    }
  ],
  "task1": {
    "dataset_details": {
      "type": "synthetic_tabular",
      "features": ["age", "education", "income"],
      "protected_attribute": "group",
      "samples": 1000,
      "bias_injection": "systematic_label_imbalance"
    },
    "model_details": {
      "baselines": ["LogisticRegression", "RandomForest", "NeuralNetwork"],
      "proposed": ["FairnessConstrainedLR", "AdversarialDebiasing"],
      "optimization": "fairness_regularized_loss"
    }
  },
  "task2": {
    "fairness_objectives": {
      "primary_metrics": ["DemographicParity", "EqualOpportunity", "EqualizedOdds"],
      "evaluation_framework": "accuracy_fairness_tradeoff",
      "mitigation_strategies": ["reweighting", "adversarial_training", "fairness_constraints"]
    }
  },
  "reproducibility": {
    "random_seed": 42,
    "computational_requirements": "lightweight",
    "dependencies": ["numpy", "pandas", "scikit-learn", "matplotlib", "seaborn"]
  }
}