# Evaluation setup. How each key is consumed is not visible in this file; the
# notes below describe structure only — confirm semantics against the loader.
evaluation:
  # 'sarvamm' is listed here and also under `evaluators`.
  base_models:
    - 'sarvamm'
    - 'llama405b'
    - 'qwen3'
  criteria:
    - 'clarity'
    - 'helpfulness'
    - 'accuracy'
    - 'completeness'
  # Each entry pairs a `name` with a `suffix` of the form `_by_<name>`
  # (presumably a column-name suffix — TODO confirm).
  evaluators:
    - name: 'sarvamm'
      suffix: '_by_sarvamm'
    - name: 'gpt4o'
      suffix: '_by_gpt4o'
    - name: 'human'
      suffix: '_by_human'

# Languages, each with the substrings used to recognise it (presumably matched
# against file names or paths — TODO confirm). Both lower-case and capitalised
# spellings are listed, which suggests the match is case-sensitive.
languages:
  - name: 'hindi'
    match_substrings:
      - 'hindi'
      - '_hi'
      - 'Hindi'
  # NOTE(review): `_hi` and `_ml` are the ISO 639-1 codes for Hindi and
  # Malayalam, but the ISO 639-1 code for Kannada is `kn` (`ka` is Georgian).
  # Confirm `_ka` is what the input names actually use.
  - name: 'kannada'
    match_substrings:
      - 'kannada'
      - '_ka'
      - 'Kannada'
  - name: 'malayalam'
    match_substrings:
      - 'malayalam'
      - '_ml'
      - 'Malayalam'

# Input discovery settings (semantics inferred from the key names — confirm
# against the loader).
data:
  # Same directory name as `plots.output_dir`.
  csv_root: 'output'
  recursive: true
  include_only_filename_substrings:
    - '_Query_Creation'
  skip_unknown_language: true

# Plot settings. The three scalar keys below sit alongside the per-plot
# sections `model_vs_language`, `model_vs_criterion` and `overall_model`.
plots:
  # Same directory name as `data.csv_root`.
  output_dir: 'output'
  dpi: 300
  style: 'white'

  # Settings for the model-vs-language plot. Values are identical to the
  # `model_vs_criterion` section.
  model_vs_language:
    # Figure grid and bars
    fig_width_per_col: 6
    fig_height_per_row: 4.2
    max_cols: 3
    bar_width: 0.75
    category_margin: 0.01
    x_label_rotation: 25

    # Font sizes
    title_fontsize: 16
    facet_title_fontsize: 11
    annotation_fontsize: 8

    # Legend
    legend_ncol: 3
    legend_fontsize: 11
    legend_title_fontsize: 12
    legend_labelspacing: 0.5
    legend_columnspacing: 1.1
    legend_handlelength: 1.5
    legend_anchor_y: 1.05
    top_legend: true

    # Y axis
    y_min: 1.5
    y_max: 2.0
    y_tick_step: 0.25
    y_headroom: 0.10

    # Layout
    suptitle_y: 1.06
    tighten: true
    tight_layout_pad: 0.6

    # Single-panel mode is off here, so the two sizes are left unset. They are
    # written as an explicit `null` rather than a bare `key:` so the intent is
    # unambiguous; the parsed value is the same.
    combined_single_panel: false
    single_panel_fig_width: null
    single_panel_fig_height: null

  # Settings for the model-vs-criterion plot. Values are identical to the
  # `model_vs_language` section.
  model_vs_criterion:
    # Figure grid and bars
    fig_width_per_col: 6
    fig_height_per_row: 4.2
    max_cols: 3
    bar_width: 0.75
    category_margin: 0.01
    x_label_rotation: 25

    # Font sizes
    title_fontsize: 16
    facet_title_fontsize: 11
    annotation_fontsize: 8

    # Legend
    legend_ncol: 3
    legend_fontsize: 11
    legend_title_fontsize: 12
    legend_labelspacing: 0.5
    legend_columnspacing: 1.1
    legend_handlelength: 1.5
    legend_anchor_y: 1.05
    top_legend: true

    # Y axis
    y_min: 1.5
    y_max: 2.0
    y_tick_step: 0.25
    y_headroom: 0.10

    # Layout
    suptitle_y: 1.06
    tighten: true
    tight_layout_pad: 0.6

    # Single-panel mode is off here, so the two sizes are left unset. They are
    # written as an explicit `null` rather than a bare `key:` so the intent is
    # unambiguous; the parsed value is the same.
    combined_single_panel: false
    single_panel_fig_width: null
    single_panel_fig_height: null

  # Settings for the overall-model plot. Keys are listed in the same order as
  # the `model_vs_language` / `model_vs_criterion` sections. This is the only
  # section that turns on `combined_single_panel` and the only one that sets
  # `title_y` and `title_legend_gap`.
  overall_model:
    # Figure grid and bars
    fig_width_per_col: 3.0
    fig_height_per_row: 4.2
    max_cols: 3
    bar_width: 0.8
    category_margin: 0.05
    x_label_rotation: 15

    # Font sizes
    title_fontsize: 18
    facet_title_fontsize: 11
    annotation_fontsize: 9

    # Legend
    legend_ncol: 3
    legend_fontsize: 11
    legend_title_fontsize: 10
    legend_labelspacing: 0.4
    legend_columnspacing: 1.2
    legend_handlelength: 1.6
    legend_anchor_y: 1.02
    top_legend: true

    # Y axis
    y_min: 1.7
    y_max: 2.05
    y_tick_step: 0.05
    y_headroom: 0.02

    # Layout
    suptitle_y: 1.04
    tighten: true
    tight_layout_pad: 0.8

    # Single-panel mode, with an explicit figure size
    combined_single_panel: true
    single_panel_fig_width: 7
    single_panel_fig_height: 5

    # Title placement
    title_y: 1.07
    title_legend_gap: 0.05

# Inter-evaluator agreement settings (semantics inferred from the key names —
# confirm against the consuming code).
agreement:
  enable_pairwise_kappa: true
  kappa_bins: 3
  min_overlap_items: 3
  # NOTE(review): presumably missing scores are replaced by this value before
  # agreement is computed — confirm 0.0 cannot be mistaken for a real score.
  fill_na_with: 0.0
  enable_percent_agreement: true
  percent_match_tolerance: 0.0
  percent_round_decimals: 3
  # No value is visible for this key in this view. If it is meant to be unset,
  # an explicit `null` would be clearer than a bare key.
  custom_kappa_edges: