{
  "title": "Recipe Site Markup Coverage and Extraction Observations 2026",
  "generatedAt": "2026-05-12T17:53:10.153Z",
  "source": "RecipeStripper public site inventory plus anonymized domain-level strip_log aggregate",
  "privacy": "No submitted recipe URLs, user identifiers, IP addresses, or saved recipe content are included.",
  "license": "CC BY 4.0",
  "siteInventoryCount": 137,
  "blockedOrLimitedCount": 4,
  "categoryCounts": {
    "major": 26,
    "baking": 8,
    "healthy": 20,
    "food-blog": 43,
    "international": 20,
    "niche": 20
  },
  "stripLogRowsAggregated": 441,
  "observedDomainCount": 122,
  "observedSuccesses": 216,
  "observedFailures": 225,
  "dataFiles": [
    "site-inventory.csv",
    "site-inventory.json",
    "domain-extraction-observations.csv",
    "domain-extraction-observations.json"
  ],
  "caveats": [
    "The site inventory is a product support inventory, not a crawl of every URL on each domain.",
    "The domain observations are anonymized operational aggregates from RecipeStripper extraction attempts.",
    "Success rates are usage-weighted (they reflect only the URLs that users submitted) and should not be interpreted as a representative web-wide benchmark."
  ]
}
