{
  "id": "bbg-p0276-architecture-source-map-architecture-source",
  "title": "Open Model Inference Flow",
  "chapter": "ai-models-and-llm-systems",
  "batch": "15",
  "rank": 141,
  "sourcePage": 276,
  "sourcePointer": "p. 276",
  "status": "accepted",
  "reviewerStatus": "reviewed",
  "fidelityScore": 0.9,
  "canvas": {
    "width": 960,
    "height": 640
  },
  "fireworksTechGraph": {
    "style": "style-1-flat-icon",
    "diagramType": "data-flow",
    "topologyNotes": [
      "source page render inspected",
      "extracted page text inspected",
      "preserve coarse grouping, sequence, and hierarchy from the inspected candidate page",
      "short generic labels only"
    ],
    "publicBoundary": [
      "original vector output",
      "no source pixels",
      "no source mark or long wording"
    ]
  },
  "callouts": [],
  "sourceReview": {
    "conceptAnchors": [
      "concept: LLM",
      "concept: How",
      "concept: Llm",
      "concept: Architecture Source Map"
    ],
    "labelSource": "source-summary",
    "semanticStatus": "reviewed"
  },
  "groups": [
    {
      "id": "input",
      "label": "Input path",
      "x": 56,
      "y": 150,
      "w": 220,
      "h": 260
    },
    {
      "id": "model",
      "label": "Model core",
      "x": 338,
      "y": 122,
      "w": 294,
      "h": 318
    },
    {
      "id": "output",
      "label": "Output path",
      "x": 694,
      "y": 150,
      "w": 210,
      "h": 260
    }
  ],
  "shapes": [
    {
      "id": "prompt",
      "kind": "rect",
      "label": "Prompt",
      "detail": "text input",
      "x": 102,
      "y": 192,
      "w": 118,
      "h": 58,
      "tone": "blue"
    },
    {
      "id": "tokens",
      "kind": "rect",
      "label": "Tokens",
      "detail": "IDs",
      "x": 102,
      "y": 318,
      "w": 118,
      "h": 58,
      "tone": "teal"
    },
    {
      "id": "router",
      "kind": "gateway",
      "label": "Sparse router",
      "detail": "expert choice",
      "x": 384,
      "y": 176,
      "w": 122,
      "h": 82,
      "tone": "orange"
    },
    {
      "id": "experts",
      "kind": "rect",
      "label": "Experts",
      "detail": "model blocks",
      "x": 474,
      "y": 318,
      "w": 118,
      "h": 58,
      "tone": "purple"
    },
    {
      "id": "context",
      "kind": "cylinder",
      "label": "Context",
      "detail": "attention",
      "x": 370,
      "y": 318,
      "w": 96,
      "h": 74,
      "tone": "green"
    },
    {
      "id": "decode",
      "kind": "rect",
      "label": "Decode",
      "detail": "next tokens",
      "x": 738,
      "y": 214,
      "w": 118,
      "h": 58,
      "tone": "blue"
    },
    {
      "id": "answer",
      "kind": "rect",
      "label": "Answer",
      "detail": "generated text",
      "x": 738,
      "y": 334,
      "w": 118,
      "h": 58,
      "tone": "green"
    }
  ],
  "connectors": [
    {
      "from": "prompt",
      "to": "tokens",
      "label": "tokenize",
      "flow": "main"
    },
    {
      "from": "tokens",
      "to": "router",
      "label": "embed",
      "flow": "data"
    },
    {
      "from": "router",
      "to": "experts",
      "label": "activate",
      "flow": "control"
    },
    {
      "from": "context",
      "to": "experts",
      "label": "attend",
      "flow": "data"
    },
    {
      "from": "experts",
      "to": "decode",
      "label": "logits",
      "flow": "main"
    },
    {
      "from": "decode",
      "to": "answer",
      "label": "detokenize",
      "flow": "main"
    }
  ]
}
