{
  "$defs": {
    "AbsorptionEvalConfig": {
      "properties": {
        "model_name": {
          "default": "",
          "description": "Model name. Must be set with a command line argument. For this eval, we currently recommend to only use models >= 2B parameters.",
          "title": "Model Name",
          "type": "string"
        },
        "random_seed": {
          "default": 42,
          "description": "Random seed",
          "title": "Random Seed",
          "type": "integer"
        },
        "f1_jump_threshold": {
          "default": 0.03,
          "description": "F1 jump threshold",
          "title": "F1 Jump Threshold",
          "type": "number"
        },
        "max_k_value": {
          "default": 10,
          "description": "Max k value",
          "title": "Max K Value",
          "type": "integer"
        },
        "prompt_template": {
          "default": "{word} has the first letter:",
          "description": "Prompt template",
          "title": "Prompt Template",
          "type": "string"
        },
        "prompt_token_pos": {
          "default": -6,
          "description": "Prompt token position",
          "title": "Prompt Token Position",
          "type": "integer"
        },
        "llm_batch_size": {
          "default": 10,
          "description": "LLM batch size. This is set by default in the main script, or it can be set with a command line argument.",
          "title": "LLM Batch Size",
          "type": "integer"
        },
        "llm_dtype": {
          "default": "float32",
          "description": "LLM data type. This is set by default in the main script, or it can be set with a command line argument.",
          "title": "LLM Data Type",
          "type": "string"
        },
        "k_sparse_probe_l1_decay": {
          "default": 0.01,
          "description": "L1 decay for k-sparse probes.",
          "title": "K-Sparse Probe L1 Decay",
          "type": "number"
        },
        "k_sparse_probe_batch_size": {
          "default": 4096,
          "description": "Batch size for k-sparse probes.",
          "title": "K-Sparse Probe Batch Size",
          "type": "integer"
        },
        "k_sparse_probe_num_epochs": {
          "default": 50,
          "description": "Number of epochs for k-sparse probes.",
          "title": "K-Sparse Probe Number of Epochs",
          "type": "integer"
        }
      },
      "title": "AbsorptionEvalConfig",
      "type": "object"
    },
    "AbsorptionMeanMetrics": {
      "properties": {
        "mean_absorption_fraction_score": {
          "description": "Average of the absorption fraction scores across all letters",
          "title": "Mean Absorption Fraction Score",
          "type": "number",
          "ui_default_display": true
        },
        "mean_full_absorption_score": {
          "description": "Average of the full absorption scores across all letters",
          "title": "Mean Full Absorption Score",
          "type": "number",
          "ui_default_display": true
        },
        "mean_num_split_features": {
          "description": "Average number of split features across all letters",
          "title": "Mean Number of Split Features",
          "type": "number",
          "ui_default_display": true
        },
        "std_dev_absorption_fraction_score": {
          "description": "Standard deviation of the absorption fraction scores across all letters",
          "title": "Standard Deviation of Absorption Fraction Score",
          "type": "number"
        },
        "std_dev_full_absorption_score": {
          "description": "Standard deviation of the full absorption scores across all letters",
          "title": "Standard Deviation of Full Absorption Score",
          "type": "number"
        },
        "std_dev_num_split_features": {
          "description": "Standard deviation of the number of split features across all letters",
          "title": "Standard Deviation of Number of Split Features",
          "type": "number"
        }
      },
      "required": [
        "mean_absorption_fraction_score",
        "mean_full_absorption_score",
        "mean_num_split_features",
        "std_dev_absorption_fraction_score",
        "std_dev_full_absorption_score",
        "std_dev_num_split_features"
      ],
      "title": "AbsorptionMeanMetrics",
      "type": "object"
    },
    "AbsorptionMetricCategories": {
      "properties": {
        "mean": {
          "$ref": "#/$defs/AbsorptionMeanMetrics",
          "description": "Mean metrics",
          "title": "Mean",
          "ui_default_display": true
        }
      },
      "required": [
        "mean"
      ],
      "title": "AbsorptionMetricCategories",
      "type": "object"
    },
    "AbsorptionResultDetail": {
      "properties": {
        "first_letter": {
          "description": "",
          "title": "First Letter",
          "type": "string"
        },
        "mean_absorption_fraction": {
          "description": "",
          "title": "Mean Absorption Fraction",
          "type": "number"
        },
        "full_absorption_rate": {
          "description": "",
          "title": "Rate of Full Absorption",
          "type": "number"
        },
        "num_full_absorption": {
          "description": "",
          "title": "Num Full Absorption",
          "type": "integer"
        },
        "num_probe_true_positives": {
          "description": "",
          "title": "Num Probe True Positives",
          "type": "integer"
        },
        "num_split_features": {
          "description": "",
          "title": "Num Split Features",
          "type": "integer"
        }
      },
      "required": [
        "first_letter",
        "mean_absorption_fraction",
        "full_absorption_rate",
        "num_full_absorption",
        "num_probe_true_positives",
        "num_split_features"
      ],
      "title": "AbsorptionResultDetail",
      "type": "object"
    }
  },
  "description": "The feature absorption evaluation looking at the first letter.",
  "properties": {
    "eval_type_id": {
      "default": "absorption_first_letter",
      "description": "The type of the evaluation",
      "title": "Eval Type ID",
      "type": "string"
    },
    "eval_config": {
      "$ref": "#/$defs/AbsorptionEvalConfig",
      "description": "The configuration of the evaluation.",
      "title": "Eval Config Type"
    },
    "eval_id": {
      "description": "A unique UUID identifying this specific eval run",
      "title": "ID",
      "type": "string"
    },
    "datetime_epoch_millis": {
      "description": "The datetime of the evaluation in epoch milliseconds",
      "title": "DateTime (epoch ms)",
      "type": "integer"
    },
    "eval_result_metrics": {
      "$ref": "#/$defs/AbsorptionMetricCategories",
      "description": "The metrics of the evaluation, organized by category. Define your own categories and the metrics that go inside them.",
      "title": "Result Metrics Categorized"
    },
    "eval_result_details": {
      "description": "Each object is a stat on the first letter of the absorption.",
      "items": {
        "$ref": "#/$defs/AbsorptionResultDetail"
      },
      "title": "Per-Letter Absorption Results",
      "type": "array"
    },
    "sae_bench_commit_hash": {
      "description": "The commit hash of the SAE Bench that ran the evaluation.",
      "title": "SAE Bench Commit Hash",
      "type": "string"
    },
    "sae_lens_id": {
      "anyOf": [
        {
          "type": "string"
        },
        {
          "type": "null"
        }
      ],
      "description": "The ID of the SAE in SAE Lens.",
      "title": "SAE Lens ID"
    },
    "sae_lens_release_id": {
      "anyOf": [
        {
          "type": "string"
        },
        {
          "type": "null"
        }
      ],
      "description": "The release ID of the SAE in SAE Lens.",
      "title": "SAE Lens Release ID"
    },
    "sae_lens_version": {
      "anyOf": [
        {
          "type": "string"
        },
        {
          "type": "null"
        }
      ],
      "description": "The version of SAE Lens that ran the evaluation.",
      "title": "SAE Lens Version"
    },
    "sae_cfg_dict": {
      "anyOf": [
        {
          "type": "object"
        },
        {
          "type": "null"
        }
      ],
      "description": "The configuration of the SAE (custom or from SAE Lens) that ran the evaluation. This should match the SAE Lens config schema.",
      "title": "SAE Config Dict"
    },
    "eval_result_unstructured": {
      "anyOf": [
        {},
        {
          "type": "null"
        }
      ],
      "default": null,
      "description": "Optional. Any additional outputs that don't fit into the structured eval_result_metrics or eval_result_details fields. Since these are unstructured, don't expect this to be easily renderable in UIs, or contain any titles or descriptions.",
      "title": "Unstructured Results"
    }
  },
  "required": [
    "eval_config",
    "eval_id",
    "datetime_epoch_millis",
    "eval_result_metrics",
    "sae_bench_commit_hash",
    "sae_lens_id",
    "sae_lens_release_id",
    "sae_lens_version",
    "sae_cfg_dict"
  ],
  "title": "Absorption",
  "type": "object"
}