{
  "dataset": {
    "breedCount": 100,
    "id": "tsinghua100_dense",
    "imageCount": 8000,
    "imagesPerBreed": {
      "max": 80,
      "min": 80
    },
    "licenseNote": "Dataset-derived images are not published here. Manifest records official-page-license-not-specified.",
    "name": "Tsinghua Dogs 100-breed dense subset",
    "rawImageCountOnDisk": 8000,
    "split": {
      "calibration": 2000,
      "test": 2000,
      "train": 4000
    }
  },
  "definitions": {
    "hierarchicalConformalFi": "For a target breed, the fraction of confuser examples whose hierarchical cluster diagnostic still includes the target breed.",
    "perClassCoverage": "RAPS empirical coverage restricted to the true breed rows in the 2,000-image test split.",
    "perClassEce": "10-bin top-confidence ECE computed within each true-breed subset. Each breed has 20 test examples, so this is diagnostic.",
    "structuredPoolingFi": "For a target breed, the fraction of confuser examples whose structured-pooling diagnostic still includes the target breed.",
    "weakClassFalseInclusion": "For the local binary target-vs-confuser probe, the fraction of confuser-cluster examples whose prediction set still includes the target breed."
  },
  "headlineMetrics": {
    "aggregateRapsCoverage": 0.968,
    "aggregateRapsCoverageDisplay": 0.968,
    "eceAfterTemperatureScaling": 0.0508,
    "eceAfterTemperatureScalingDisplay": 0.051,
    "meanRapsSetSize": 2.5885,
    "meanRapsSetSizeDisplay": 2.59,
    "medianRapsSetSize": 2.0,
    "p90RapsSetSize": 3.0,
    "rapsEmptySetCount": 0,
    "rapsMaxSetSize": 9,
    "rapsMissCount": 64,
    "top1Accuracy": 0.8455,
    "top1AccuracyDisplay": 0.846
  },
  "highFiClusterExperiments": {
    "boundary": "Structured pooling and hierarchical conformal rows are high-FI cluster diagnostics. They are not replacements for the global 100-way RAPS predictor.",
    "claimStatus": "WIN: both structured pooling and hierarchical conformal meet the stated false-inclusion gate. Select structured_pooling by target-class coverage first, then false inclusion. Report coverage tradeoffs explicitly; this is not a deployable classifier fix.",
    "laneVerdict": {
      "hierarchical_conformal": "WIN",
      "structured_pooling": "WIN",
      "winner": "structured_pooling",
      "winner_selection_rule": "among methods satisfying the false-inclusion gate, prefer higher target-class coverage on the held-out rows, then lower target false inclusion"
    },
    "metrics": {
      "hierarchical_conformal_success": 1.0,
      "structured_pooling_success": 1.0,
      "target_baseline_false_inclusion": 0.65,
      "target_hierarchical_false_inclusion": 0.0667,
      "target_structured_false_inclusion": 0.1
    },
    "rows": [
      {
        "baselineFalseInclusion": 0.0,
        "baselineTargetCoverage": 0.9,
        "breed": "bluetick",
        "globalRapsCoverage": 0.9,
        "hierarchicalFalseInclusion": 0.0,
        "hierarchicalTargetCoverage": 0.9,
        "hierarchicalTier1ClusterCoverage": 0.9125,
        "mondrianRapsCoverage": 0.6,
        "structuredFalseInclusion": 0.0,
        "structuredSelectedQuorum": 3,
        "structuredTargetCoverage": 0.85
      },
      {
        "baselineFalseInclusion": 0.0833,
        "baselineTargetCoverage": 0.8,
        "breed": "great_dane",
        "globalRapsCoverage": 0.8,
        "hierarchicalFalseInclusion": 0.0,
        "hierarchicalTargetCoverage": 0.5,
        "hierarchicalTier1ClusterCoverage": 0.875,
        "mondrianRapsCoverage": 0.7,
        "structuredFalseInclusion": 0.0167,
        "structuredSelectedQuorum": 3,
        "structuredTargetCoverage": 0.6
      },
      {
        "baselineFalseInclusion": 0.2833,
        "baselineTargetCoverage": 0.95,
        "breed": "lhasa",
        "globalRapsCoverage": 0.85,
        "hierarchicalFalseInclusion": 0.1167,
        "hierarchicalTargetCoverage": 0.95,
        "hierarchicalTier1ClusterCoverage": 0.9625,
        "mondrianRapsCoverage": 0.85,
        "structuredFalseInclusion": 0.1167,
        "structuredSelectedQuorum": 3,
        "structuredTargetCoverage": 0.8
      },
      {
        "baselineFalseInclusion": 0.65,
        "baselineTargetCoverage": 0.95,
        "breed": "tibetan_mastiff",
        "globalRapsCoverage": 0.85,
        "hierarchicalFalseInclusion": 0.0667,
        "hierarchicalTargetCoverage": 0.85,
        "hierarchicalTier1ClusterCoverage": 0.8875,
        "mondrianRapsCoverage": 0.9,
        "structuredFalseInclusion": 0.1,
        "structuredSelectedQuorum": 3,
        "structuredTargetCoverage": 0.95
      }
    ],
    "selection": {
      "confusers": "temperature_scaled_nearest_prototype_test_errors_with_probability_backfill",
      "linear_probe_l2_metric": "calibration_nll",
      "structured_pooling_quorum": "selected on calibration rows by minimum false inclusion among quorums with calibration target coverage at or above target coverage",
      "used_test_labels_for_method_selection": false
    },
    "successMetric": {
      "held_out_non_degradation_classes": [
        "bluetick",
        "great_dane",
        "lhasa"
      ],
      "non_degradation_definition": "candidate false inclusion must be less than or equal to the baseline local linear-head false inclusion on the held-out test rows",
      "target_class": "tibetan_mastiff",
      "target_false_inclusion_goal": 0.2
    },
    "targetCoverage": 0.9
  },
  "links": {
    "methodology": "https://www.smartbreeds.io/reliability#methodology",
    "rawJson": "https://www.smartbreeds.io/api/reproducibility/tsinghua100-dense"
  },
  "model": {
    "classifier": "frozen DINOv2-small nearest-prototype head",
    "featureExtractor": "timm:vit_small_patch14_dinov2.lvd142m",
    "id": "dinov2_small_lvd142m_v0",
    "seed": 7,
    "temperature": 0.04583187
  },
  "perClass": [
    {
      "breed": "affenpinscher",
      "coverage": 1.0,
      "ece": 0.0435,
      "meanSetSize": 2.1,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "afghan_hound",
      "coverage": 1.0,
      "ece": 0.0661,
      "meanSetSize": 2.2,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "african_hunting_dog",
      "coverage": 1.0,
      "ece": 0.015,
      "meanSetSize": 2.05,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "airedale",
      "coverage": 1.0,
      "ece": 0.2703,
      "meanSetSize": 3.3,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "american_staffordshire_terrier",
      "coverage": 0.95,
      "ece": 0.1834,
      "meanSetSize": 2.65,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "appenzeller",
      "coverage": 1.0,
      "ece": 0.2162,
      "meanSetSize": 2.95,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "australian_shepherd",
      "coverage": 0.85,
      "ece": 0.2399,
      "meanSetSize": 2.95,
      "missCount": 3,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "australian_terrier",
      "coverage": 0.9,
      "ece": 0.3444,
      "meanSetSize": 2.7,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "basset",
      "coverage": 1.0,
      "ece": 0.1288,
      "meanSetSize": 2.4,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "bedlington_terrier",
      "coverage": 1.0,
      "ece": 0.0965,
      "meanSetSize": 2.3,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "bernese_mountain_dog",
      "coverage": 1.0,
      "ece": 0.1539,
      "meanSetSize": 2.9,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "black_and_tan_coonhound",
      "coverage": 1.0,
      "ece": 0.1005,
      "meanSetSize": 2.45,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "blenheim_spaniel",
      "coverage": 1.0,
      "ece": 0.112,
      "meanSetSize": 2.35,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "bloodhound",
      "coverage": 1.0,
      "ece": 0.084,
      "meanSetSize": 2.3,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "bluetick",
      "coverage": 0.9,
      "ece": 0.1702,
      "meanSetSize": 2.55,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": 0.0
    },
    {
      "breed": "border_terrier",
      "coverage": 1.0,
      "ece": 0.0746,
      "meanSetSize": 2.2,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "borzoi",
      "coverage": 0.95,
      "ece": 0.0926,
      "meanSetSize": 2.45,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "boston_bull",
      "coverage": 1.0,
      "ece": 0.1056,
      "meanSetSize": 2.0,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "bouvier_des_flandres",
      "coverage": 0.95,
      "ece": 0.2537,
      "meanSetSize": 3.1,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "boxer",
      "coverage": 1.0,
      "ece": 0.1636,
      "meanSetSize": 2.4,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "brabancon_griffo",
      "coverage": 1.0,
      "ece": 0.0655,
      "meanSetSize": 2.2,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "briard",
      "coverage": 0.9,
      "ece": 0.0944,
      "meanSetSize": 2.65,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "brittany_spaniel",
      "coverage": 1.0,
      "ece": 0.1594,
      "meanSetSize": 2.45,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "bull_mastiff",
      "coverage": 0.95,
      "ece": 0.1245,
      "meanSetSize": 2.15,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "cairn",
      "coverage": 0.95,
      "ece": 0.175,
      "meanSetSize": 3.0,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "chesapeake_bay_retriever",
      "coverage": 1.0,
      "ece": 0.0969,
      "meanSetSize": 2.4,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "chinese_crested_dog",
      "coverage": 1.0,
      "ece": 0.1311,
      "meanSetSize": 2.45,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "clumber",
      "coverage": 1.0,
      "ece": 0.0817,
      "meanSetSize": 2.25,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "collie",
      "coverage": 1.0,
      "ece": 0.0915,
      "meanSetSize": 2.65,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "curly_coated_retriever",
      "coverage": 0.9,
      "ece": 0.0982,
      "meanSetSize": 2.15,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "dandie_dinmont",
      "coverage": 1.0,
      "ece": 0.1789,
      "meanSetSize": 2.75,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "dhole",
      "coverage": 1.0,
      "ece": 0.0127,
      "meanSetSize": 2.0,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "dingo",
      "coverage": 0.95,
      "ece": 0.1017,
      "meanSetSize": 2.15,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "doberman",
      "coverage": 1.0,
      "ece": 0.1667,
      "meanSetSize": 2.55,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "english_foxhound",
      "coverage": 1.0,
      "ece": 0.2634,
      "meanSetSize": 2.4,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "english_setter",
      "coverage": 0.85,
      "ece": 0.1342,
      "meanSetSize": 2.55,
      "missCount": 3,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "entlebucher",
      "coverage": 1.0,
      "ece": 0.3138,
      "meanSetSize": 3.0,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "eskimo_dog",
      "coverage": 0.95,
      "ece": 0.2259,
      "meanSetSize": 3.35,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "fila_braziliero",
      "coverage": 1.0,
      "ece": 0.1676,
      "meanSetSize": 2.9,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "flat_coated_retriever",
      "coverage": 0.95,
      "ece": 0.1218,
      "meanSetSize": 2.45,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "french_bulldog",
      "coverage": 1.0,
      "ece": 0.0962,
      "meanSetSize": 2.25,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "german_shepherd",
      "coverage": 1.0,
      "ece": 0.0979,
      "meanSetSize": 2.2,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "german_short_haired_pointer",
      "coverage": 0.95,
      "ece": 0.1268,
      "meanSetSize": 2.6,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "giant_schnauzer",
      "coverage": 1.0,
      "ece": 0.2221,
      "meanSetSize": 3.0,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "gordon_setter",
      "coverage": 1.0,
      "ece": 0.1046,
      "meanSetSize": 2.3,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "great_dane",
      "coverage": 0.8,
      "ece": 0.2178,
      "meanSetSize": 3.45,
      "missCount": 4,
      "testSampleCount": 20,
      "weakClassFalseInclusion": 0.0833
    },
    {
      "breed": "great_pyrenees",
      "coverage": 1.0,
      "ece": 0.2707,
      "meanSetSize": 2.55,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "greater_swiss_mountain_dog",
      "coverage": 0.9,
      "ece": 0.2061,
      "meanSetSize": 3.0,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "groenendael",
      "coverage": 1.0,
      "ece": 0.0446,
      "meanSetSize": 2.1,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "ibizan_hound",
      "coverage": 1.0,
      "ece": 0.0818,
      "meanSetSize": 2.3,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "irish_setter",
      "coverage": 1.0,
      "ece": 0.1086,
      "meanSetSize": 2.3,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "irish_terrier",
      "coverage": 0.9,
      "ece": 0.1685,
      "meanSetSize": 3.05,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "irish_water_spaniel",
      "coverage": 1.0,
      "ece": 0.108,
      "meanSetSize": 2.05,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "irish_wolfhound",
      "coverage": 1.0,
      "ece": 0.2652,
      "meanSetSize": 2.75,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "italian_greyhound",
      "coverage": 1.0,
      "ece": 0.1341,
      "meanSetSize": 2.55,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "keeshond",
      "coverage": 1.0,
      "ece": 0.068,
      "meanSetSize": 2.05,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "kelpie",
      "coverage": 0.9,
      "ece": 0.2202,
      "meanSetSize": 2.9,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "kerry_blue_terrier",
      "coverage": 0.9,
      "ece": 0.1929,
      "meanSetSize": 3.25,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "kuvasz",
      "coverage": 0.95,
      "ece": 0.2232,
      "meanSetSize": 2.15,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "lakeland_terrier",
      "coverage": 0.9,
      "ece": 0.2071,
      "meanSetSize": 3.4,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "leonberg",
      "coverage": 1.0,
      "ece": 0.0901,
      "meanSetSize": 2.4,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "lhasa",
      "coverage": 0.85,
      "ece": 0.2019,
      "meanSetSize": 2.35,
      "missCount": 3,
      "testSampleCount": 20,
      "weakClassFalseInclusion": 0.2833
    },
    {
      "breed": "malamute",
      "coverage": 0.95,
      "ece": 0.3718,
      "meanSetSize": 3.4,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "malinois",
      "coverage": 1.0,
      "ece": 0.1225,
      "meanSetSize": 2.3,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "mexican_hairless",
      "coverage": 1.0,
      "ece": 0.1291,
      "meanSetSize": 2.45,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "miniature_poodle",
      "coverage": 0.9,
      "ece": 0.1739,
      "meanSetSize": 2.3,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "newfoundland",
      "coverage": 1.0,
      "ece": 0.0878,
      "meanSetSize": 2.25,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "norfolk_terrier",
      "coverage": 0.95,
      "ece": 0.2596,
      "meanSetSize": 3.3,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "norwegian_elkhound",
      "coverage": 1.0,
      "ece": 0.1433,
      "meanSetSize": 2.5,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "norwich_terrier",
      "coverage": 0.85,
      "ece": 0.2021,
      "meanSetSize": 3.0,
      "missCount": 3,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "otterhound",
      "coverage": 1.0,
      "ece": 0.2053,
      "meanSetSize": 2.8,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "pembroke",
      "coverage": 1.0,
      "ece": 0.0614,
      "meanSetSize": 2.25,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "pomeranian",
      "coverage": 0.95,
      "ece": 0.0887,
      "meanSetSize": 2.7,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "redbone",
      "coverage": 0.9,
      "ece": 0.2729,
      "meanSetSize": 3.35,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "rhodesian_ridgeback",
      "coverage": 1.0,
      "ece": 0.2055,
      "meanSetSize": 3.0,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "rottweiler",
      "coverage": 1.0,
      "ece": 0.1186,
      "meanSetSize": 2.6,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "saint_bernard",
      "coverage": 1.0,
      "ece": 0.0898,
      "meanSetSize": 2.45,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "saluki",
      "coverage": 1.0,
      "ece": 0.0651,
      "meanSetSize": 2.4,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "samoyed",
      "coverage": 1.0,
      "ece": 0.061,
      "meanSetSize": 2.3,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "schipperke",
      "coverage": 1.0,
      "ece": 0.058,
      "meanSetSize": 2.05,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "scotch_terrier",
      "coverage": 0.95,
      "ece": 0.2262,
      "meanSetSize": 3.0,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "scottish_deerhound",
      "coverage": 1.0,
      "ece": 0.2323,
      "meanSetSize": 2.1,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "sealyham_terrier",
      "coverage": 0.95,
      "ece": 0.1347,
      "meanSetSize": 2.55,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "shiba_dog",
      "coverage": 0.9,
      "ece": 0.0671,
      "meanSetSize": 2.25,
      "missCount": 2,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "siberian_husky",
      "coverage": 0.95,
      "ece": 0.2014,
      "meanSetSize": 3.0,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "silky_terrier",
      "coverage": 1.0,
      "ece": 0.1301,
      "meanSetSize": 2.65,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "soft_coated_wheaten_terrier",
      "coverage": 0.85,
      "ece": 0.1043,
      "meanSetSize": 3.7,
      "missCount": 3,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "staffordshire_bullterrier",
      "coverage": 1.0,
      "ece": 0.1606,
      "meanSetSize": 2.6,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "standard_schnauzer",
      "coverage": 1.0,
      "ece": 0.1503,
      "meanSetSize": 3.15,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "sussex_spaniel",
      "coverage": 1.0,
      "ece": 0.0702,
      "meanSetSize": 2.2,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "tibetan_mastiff",
      "coverage": 0.85,
      "ece": 0.2393,
      "meanSetSize": 2.5,
      "missCount": 3,
      "testSampleCount": 20,
      "weakClassFalseInclusion": 0.65
    },
    {
      "breed": "tibetan_terrier",
      "coverage": 1.0,
      "ece": 0.1751,
      "meanSetSize": 2.7,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "toy_terrier",
      "coverage": 1.0,
      "ece": 0.1187,
      "meanSetSize": 2.4,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "vizsla",
      "coverage": 1.0,
      "ece": 0.3496,
      "meanSetSize": 3.0,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "walker_hound",
      "coverage": 1.0,
      "ece": 0.1889,
      "meanSetSize": 2.85,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "weimaraner",
      "coverage": 1.0,
      "ece": 0.1525,
      "meanSetSize": 2.65,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "welsh_springer_spaniel",
      "coverage": 0.95,
      "ece": 0.1587,
      "meanSetSize": 2.95,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "west_highland_white_terrier",
      "coverage": 1.0,
      "ece": 0.1365,
      "meanSetSize": 2.1,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "whippet",
      "coverage": 0.95,
      "ece": 0.1933,
      "meanSetSize": 2.55,
      "missCount": 1,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    },
    {
      "breed": "wire_haired_fox_terrier",
      "coverage": 1.0,
      "ece": 0.1519,
      "meanSetSize": 2.85,
      "missCount": 0,
      "testSampleCount": 20,
      "weakClassFalseInclusion": null
    }
  ],
  "raps": {
    "alpha": 0.1,
    "selectedParameters": {
      "k_reg": 1,
      "penalty_lambda": 0.1
    },
    "selectionPolicy": "Pick the eligible parameter set with smallest tuning mean set size. Ties prefer higher tuning coverage, then smaller penalty and k.",
    "selectionStatus": "selected_from_candidates_meeting_tuning_coverage",
    "targetCoverage": 0.9
  },
  "refresh": {
    "artifactCreatedAt": "2026-06-02T00:33:29.886244+00:00",
    "artifactRefreshCadence": "Regenerated when SmartBreeds research artifacts are refreshed; public endpoint cache revalidates hourly.",
    "endpointCache": "1 hour",
    "lastRefreshedAt": "2026-06-04T16:39:12.084291+00:00"
  },
  "schemaVersion": "smartbreeds.reproducibility.tsinghua100-dense.v2",
  "sourceArtifacts": [
    {
      "path": "data/evaluations/tsinghua100_dense_dinov2_small_lvd142m_v0_raps_tuning.json",
      "repo": "Robby955/SmartBreeds"
    },
    {
      "path": "data/evaluations/tsinghua100_dense_dinov2_small_lvd142m_v0_local_discriminant_heads.json",
      "repo": "Robby955/SmartBreeds"
    },
    {
      "path": "data/evaluations/tsinghua100_dense_dinov2_small_lvd142m_v0_cluster_conformal.json",
      "repo": "Robby955/SmartBreeds"
    },
    {
      "path": "data/evaluations/tsinghua100_dense_dinov2_small_lvd142m_v0_score_cache.npz",
      "repo": "Robby955/SmartBreeds"
    },
    {
      "path": "data/sources/tsinghua_dogs_tsinghua100_dense_manifest.jsonl",
      "repo": "Robby955/SmartBreeds"
    }
  ],
  "weakClassFalseInclusion": {
    "bluetick": 0.0,
    "great_dane": 0.0833,
    "lhasa": 0.2833,
    "tibetan_mastiff": 0.65
  }
}
