{
  "benchmark": "cyp3a4_inducer_v25_external_holdout",
  "version": "v25_physics",
  "generated": "2026-04-27T14:12:13",
  "input": "validation_data/cyp3a4_inducer_v16_larger_control_holdout.json",
  "prediction_basis": "Flux Physics",
  "basis_note": "On-the-fly Flux physics scorer. Reference labels are used for benchmark scoring, not to produce predictions.",
  "primary_metric": {
    "description": "Primary-only external metric after excluding rows overlapping the current reference snapshot.",
    "n": 405,
    "balanced_accuracy": 0.9350,
    "accuracy": 0.9926,
    "precision": 0.7778,
    "recall": 0.8750,
    "specificity": 0.9950,
    "f1": 0.8235,
    "tp": 7,
    "fp": 2,
    "fn": 1,
    "tn": 395
  },
  "all_scored_rows": {
    "n": 686,
    "balanced_accuracy": 0.9652,
    "accuracy": 0.9956,
    "precision": 0.8750,
    "recall": 0.9333,
    "specificity": 0.9970,
    "f1": 0.9032,
    "tp": 14,
    "fp": 2,
    "fn": 1,
    "tn": 669
  },
  "gate": {
    "external_balanced_accuracy_ge_0_75": "PASS",
    "external_recall_ge_0_70": "PASS",
    "external_specificity_ge_0_75": "PASS"
  }
}
