params:
  - fig_params/figs.yaml

vars:
  - fig_params/figs.yaml

stages:

  # Wrangle

  # n-bootstrap should be 10000 in the final version
  wrangle_bootstrap_logistic:
    foreach: &foreach_logistic
      headline: ${figs.wrangle_logistic.headline}
    do:
      cmd: >-
        python -m src.wrangle.bootstrap
        --fig-name ${key}
        --runs-file ${item.runs_file}
        --output-bootstrap-horizons-file data/wrangled/bootstrap/${key}.csv
        --n-bootstrap ${n_bootstrap}
      deps:
        - src/wrangle/bootstrap.py
        - src/utils/logistic.py
        - ${item.runs_file}
      params:
        - fig_params/figs.yaml:
            - figs.wrangle_logistic.${key}
        - n_bootstrap
      outs:
        - data/wrangled/bootstrap/${key}.csv
      desc: Compute bootstrapped logistic regression results

  wrangle_logistic_regression:
    foreach: *foreach_logistic
    do:
      cmd: >-
        python -m src.wrangle.logistic
        --fig-name ${key}
        --runs-file ${item.runs_file}
        --output-logistic-fits-file data/wrangled/logistic_fits/${key}.csv
        --release-dates data/external/release_dates.yaml
        --bootstrap-file data/wrangled/bootstrap/${key}.csv
      deps:
        - ${item.runs_file}
        - data/external/release_dates.yaml
        - data/wrangled/bootstrap/${key}.csv
        - src/wrangle/logistic.py
        - src/utils/logistic.py
      params:
        - fig_params/figs.yaml:
            - figs.wrangle_logistic.${key}
      outs:
        - data/wrangled/logistic_fits/${key}.csv
      desc: Fit logistic curves for each agent, load bootstrap results from bootstrap stage, and add binned weighted success rate data.

  wrangle_multiverse_boxplot:
    cmd: >-
      python -m src.wrangle.multiverse_boxplot
      --runs-file data/interim/filtered_runs.jsonl
      --logistic-fits-file data/wrangled/logistic_fits/headline.csv
      --release-dates-file data/external/release_dates.yaml
      --output-records-file data/wrangled/multiverse/records.json
      --log-level ${log_level}
      --seed 42
    deps:
      - src/wrangle/multiverse_boxplot.py
      - src/plot/logistic.py
      - src/wrangle/bootstrap.py
      - src/wrangle/logistic.py
      - data/interim/filtered_runs.jsonl
      - data/external/release_dates.yaml
      - data/wrangled/logistic_fits/headline.csv
    params:
      - log_level
      - fig_params/figs.yaml:
          - figs.plot_multiverse_boxplot
    outs:
      - data/wrangled/multiverse/records.json
    desc: Generate multiverse boxplot data for uncertainty analysis.

  wrangle_score_over_resource:
    foreach:
      - x: generation_cost
        include_human: { args: { include-human: true }, label: "_with_human" }
        weighting_column: invsqrt_task_weight
        score_column: score_binarized
    do:
      cmd: >-
        python src/wrangle/score_over_resource.py
        --runs-file data/interim/filtered_runs.jsonl
        --output-file data/wrangled/score_over_resource/${item.x}${item.include_human.label}${item.weighting_column}${item.score_column}.jsonl
        --x ${item.x}
        --score-column ${item.score_column}
        --weighting-column ${item.weighting_column}
        ${item.include_human.args}
      deps:
        - data/interim/filtered_runs.jsonl
        - src/wrangle/score_over_resource.py
      outs:
        - data/wrangled/score_over_resource/${item.x}${item.include_human.label}${item.weighting_column}${item.score_column}.jsonl
      desc: Wrangle the score over resource data.

  # Plot

  plot_bar_chart_weighted_scores:
    cmd: >-
      python -m src.plot.bar_chart_weighted_scores
      --fig-name headline
      --metrics-file data/wrangled/logistic_fits/headline.csv
      --release-dates data/external/release_dates.yaml
      --output-file plots/bar_chart_weighted_scores/headline.${plot_format}
      --log-level ${log_level}
    deps:
      - src/plot/bar_chart_weighted_scores.py
      - src/utils/plots.py
      - data/external/release_dates.yaml
      - data/wrangled/logistic_fits/headline.csv
    params:
      - log_level
      - plot_format
      - plots
      - weighting
      - fig_params/figs.yaml:
          - figs.plot_bar_chart_weighted_scores
    plots:
      - plots/bar_chart_weighted_scores/headline.${plot_format}
    desc: Generate bar chart of weighted scores.

  plot_logistic_regression:
    foreach:
      all_models: ${figs.plot_logistic_regression.all_models}

    do:
      cmd: >-
        python -m src.plot.logistic
        --input-file data/wrangled/logistic_fits/${item.logistic_file}.csv
        --runs-file ${item.runs_file}
        --release-dates data/external/release_dates.yaml
        --output-file plots/logistic/${key}.${plot_format}
        --log-level ${log_level}
        --script-parameter-group ${key}
      deps:
        - ${item.runs_file}
        - data/wrangled/logistic_fits/${item.logistic_file}.csv
        - matplotlibrc
        - src/plot/logistic.py
        - src/utils/plots.py
      params:
        - log_level
        - plot_format
        - plots
        - fig_params/figs.yaml:
            - figs.plot_logistic_regression.${key}
      # plots:
      #   - plots/logistic/${key}.${plot_format}
      outs:
        - plots/logistic/${key}.${plot_format}
            # persist: true
      desc: Plot showing horizon growth over time.


  plot_multiverse_boxplot:
    cmd: >-
      python -m src.plot.multiverse_boxplot
      --records-file data/wrangled/multiverse/records.json
      --output-file plots/multiverse/boxplot.${plot_format}
      --output-metrics-file metrics/multiverse_boxplot.yaml
      --log-level ${log_level}
    deps:
      - src/plot/multiverse_boxplot.py
      - src/utils/plots.py
      - data/wrangled/multiverse/records.json
      - matplotlibrc
    params:
      - log_level
      - plot_format
      - fig_params/figs.yaml:
          - figs.plot_multiverse_boxplot
    plots:
      - plots/multiverse/boxplot.${plot_format}
      - plots/multiverse/boxplot_total_box.${plot_format}
      - plots/multiverse/boxplot_total_violin.${plot_format}
    metrics:
      - metrics/multiverse_boxplot.yaml:
          cache: false
    desc: Horizontal boxplots tracking various sources of uncertainty.

  plot_individual_histograms:
    foreach: ${figs.plot_individual_histograms}
    do:
      cmd: >-
        python -m src.plot.individual_histograms
        --all-runs-file data/interim/filtered_runs.jsonl
        --output-file plots/individual_histograms/${key}/histograms.${plot_format}
        --plot-format ${plot_format}
        --log-level ${log_level}
        --script-parameter-group ${key}
        --params-file "params.yaml"
      deps:
        - ${item.logistic_file}
        - data/interim/filtered_runs.jsonl
        - matplotlibrc
        - src/plot/individual_histograms.py
        - src/utils/plots.py
      params:
        - log_level
        - plot_format
        - plots
        - fig_params/figs.yaml:
            - figs.plot_individual_histograms.${key}
      # plots:
      #   - plots/individual_histograms/${key}/histograms.${plot_format}
      outs:
        - plots/individual_histograms/${key}/histograms.${plot_format}:
            persist: true
      desc: Logistic success curve + bars for each agent.


  plot_bootstrap_ci:
    matrix:
      fig_name: [headline]
      y_scale: [log]
    cmd: >-
      python -m src.plot.bootstrap_ci
      --fig-name ${item.fig_name}
      --input-file data/wrangled/bootstrap/headline.csv
      --agent-summaries-file data/wrangled/logistic_fits/headline.csv
      --release-dates data/external/release_dates.yaml
      --output-file plots/bootstrap/${item.fig_name}-${item.y_scale}.${plot_format}
      --log-level ${log_level}
      --y-scale ${item.y_scale}
    deps:
      - src/plot/bootstrap_ci.py
      - src/plot/logistic.py # dependency on plot_trendline
      - data/wrangled/bootstrap/headline.csv
      - data/wrangled/logistic_fits/headline.csv
      - data/external/release_dates.yaml
      - matplotlibrc
    params:
      - log_level
      - plot_format
      - plots
      - fig_params/figs.yaml:
          - figs.plot_logistic_regression.${item.fig_name}
    plots:
      - plots/bootstrap/${item.fig_name}-${item.y_scale}.${plot_format}
    desc: Generate plot of bootstrap confidence intervals


  plot_score_over_resource_line:
    foreach:
      - x: generation_cost
        plot_human: { args: { plot-human: true }, label: "_with_human" }
        weighting_column: invsqrt_task_weight
        score_column: score_binarized
    do:
      cmd: >-
        python src/plot/score_over_resource_line.py
        --wrangled-resource-file data/wrangled/score_over_resource/${item.x}${item.plot_human.label}${item.weighting_column}${item.score_column}.jsonl
        --output-file plots/success_over_resource/line_${item.x}${item.plot_human.label}${item.weighting_column}${item.score_column}.png
        --params-file params.yaml
        --x ${item.x}
        --score-column ${item.score_column}
        --weighting-column ${item.weighting_column}
      deps:
        - data/wrangled/score_over_resource/${item.x}${item.plot_human.label}${item.weighting_column}${item.score_column}.jsonl
        - src/plot/score_over_resource_line.py
      outs:
        - plots/success_over_resource/line_${item.x}${item.plot_human.label}${item.weighting_column}${item.score_column}.png
      desc: Plot showing the score over resource line chart.
