{
  "id": "bbg-p0212-algorithms-and-decision-models-algorithms",
  "title": "Space-Saving Data Structures",
  "chapter": "algorithms-and-decision-models",
  "batch": "26",
  "rank": 255,
  "sourcePage": 212,
  "sourcePointer": "p. 212",
  "status": "accepted",
  "reviewerStatus": "reviewed",
  "fidelityScore": 0.9,
  "canvas": {
    "width": 960,
    "height": 640
  },
  "fireworksTechGraph": {
    "style": "style-1-flat-icon",
    "diagramType": "comparison",
    "topologyNotes": [
      "source page render inspected",
      "extracted page text inspected",
      "source page render inspected",
      "preserve six space-saving structures: Bloom filter, HyperLogLog, Cuckoo filter, MinHash, SimHash, and Count-Min Sketch",
      "omit tiny source illustrations and copied prose"
    ],
    "publicBoundary": [
      "original vector output",
      "no source pixels",
      "no source mark or long wording"
    ]
  },
  "callouts": [],
  "sourceReview": {
    "conceptAnchors": [
      "concept: approximate membership",
      "concept: cardinality estimate",
      "concept: deletion-capable filter",
      "concept: similarity estimate",
      "concept: frequency estimate"
    ],
    "labelSource": "curated",
    "semanticStatus": "reviewed"
  },
  "groups": [
    {
      "id": "membership",
      "label": "Membership",
      "x": 62,
      "y": 128,
      "w": 242,
      "h": 286
    },
    {
      "id": "similarity",
      "label": "Similarity",
      "x": 360,
      "y": 128,
      "w": 242,
      "h": 286
    },
    {
      "id": "counting",
      "label": "Counting",
      "x": 658,
      "y": 128,
      "w": 242,
      "h": 286
    }
  ],
  "shapes": [
    {
      "id": "bloom",
      "kind": "rect",
      "label": "Bloom filter",
      "detail": "maybe in set",
      "x": 100,
      "y": 176,
      "w": 122,
      "h": 54,
      "tone": "blue"
    },
    {
      "id": "cuckoo",
      "kind": "rect",
      "label": "Cuckoo filter",
      "detail": "deletable",
      "x": 100,
      "y": 304,
      "w": 122,
      "h": 54,
      "tone": "orange"
    },
    {
      "id": "minhash",
      "kind": "rect",
      "label": "MinHash",
      "detail": "set similarity",
      "x": 400,
      "y": 176,
      "w": 122,
      "h": 54,
      "tone": "green"
    },
    {
      "id": "simhash",
      "kind": "rect",
      "label": "SimHash",
      "detail": "near duplicate",
      "x": 400,
      "y": 304,
      "w": 122,
      "h": 54,
      "tone": "purple"
    },
    {
      "id": "hll",
      "kind": "rect",
      "label": "HyperLogLog",
      "detail": "cardinality",
      "x": 700,
      "y": 176,
      "w": 122,
      "h": 54,
      "tone": "teal"
    },
    {
      "id": "cms",
      "kind": "table",
      "label": "Count-Min",
      "detail": "frequency",
      "x": 700,
      "y": 298,
      "w": 122,
      "h": 66,
      "tone": "gray"
    }
  ],
  "connectors": [
    {
      "from": "bloom",
      "to": "cuckoo",
      "label": "delete",
      "flow": "control"
    },
    {
      "from": "minhash",
      "to": "simhash",
      "label": "compare",
      "flow": "data"
    },
    {
      "from": "hll",
      "to": "cms",
      "label": "estimate",
      "flow": "data"
    },
    {
      "from": "bloom",
      "to": "hll",
      "label": "compact",
      "flow": "main"
    },
    {
      "from": "simhash",
      "to": "cms",
      "label": "sketch",
      "flow": "async"
    }
  ]
}
