diff --git a/.agent-plan.md b/.agent-plan.md
index 4ed3a55..04dc996 100644
--- a/.agent-plan.md
+++ b/.agent-plan.md
@@ -6,35 +6,42 @@
 
 ## Current System State
 
-**v0.4.0 in progress — Milestone 7 complete (PR open).** Full simulation engine implemented:
-per-lead mutable state, 90-day daily-step loop, touch/session/sales-activity emission,
-HazardTransition stage advancement, ConversionHazard final-close, and post-conversion
-opportunity/customer/subscription creation. 490 tests passing.
+**v0.4.0 in progress — Milestones 7–8 complete (PRs open).** Full simulation engine + render/bundle
+layer implemented. 521 tests passing.
 
 ---
 
-## Active Task Breakdown — Milestone 8: Observation Model (v0.4.0)
+## Next Up — Milestone 9: Exposure Filtering (v0.4.0)
 
-Goal: Transform the hidden simulated world into realistic CRM-like observations.
+Goal: Apply `student_public` / `research_instructor` exposure-mode filtering during bundle write.
 
-- [ ] **1. Snapshot builder** (`render/snapshots.py`) — lead-anchored flat feature snapshot
-- [ ] **2. Relational export** (`render/relational.py`) — DataFrame per table from SimulationResult
-- [ ] **3. Task export** (`render/tasks.py`) — train/valid/test Parquet split for `converted_within_90_days`
-- [ ] **4. Manifest builder** (`render/manifests.py`) — bundle manifest.json
-- [ ] **5. Bundle writer** (`api/bundle.py`) — `WorldBundle.save(path)`
+- [ ] `exposure/modes.py` — `ExposureMode`-aware filter dispatch
+- [ ] `exposure/filters.py` — column/table redaction rules per mode
+- [ ] `exposure/redaction.py` — latent-column scrubbing for `student_public`
+- [ ] Wire into `api/bundle.py` write pipeline
 
 ---
 
 ## Context Pointers
 
-- Milestone 7 scope: `docs/leadforge_implementation_plan.md` §10 "Milestone 7"
-- Simulation spec: `docs/leadforge_architecture_spec.md` §11 "Simulation engine"
-- Mechanism layer: `leadforge/mechanisms/` (all M6 files)
+- Milestone 8 scope: `docs/leadforge_implementation_plan.md` §10 "Milestone 8"
+- Render layer: `leadforge/render/` (snapshots, relational, tasks, manifests)
+- Bundle writer: `leadforge/api/bundle.py`
 
 ---
 
 ## Completed Phases
 
+### Milestone 8 — Render / Bundle Layer ✓ (v0.4.0 in PR)
+- `render/relational.py`: `to_dataframes()` — 9-table dict of typed DataFrames from SimulationResult + PopulationResult
+- `render/snapshots.py`: `build_snapshot()` — 30-column leakage-free lead snapshot with touch/session/activity aggregates, account/contact field joins
+- `render/tasks.py`: `write_task_splits()` — deterministic 70/15/15 train/valid/test Parquet split + `task_manifest.json`
+- `render/manifests.py`: `build_manifest()` / `write_manifest()` — manifest.json with provenance, row counts, SHA-256 hashes
+- `api/bundle.py`: `write_bundle()` — orchestrates all render steps; writes full bundle to disk
+- `core/models.py`: `WorldBundle.save(path)` — delegates to `write_bundle()` via lazy import
+- `api/generator.py`: `Generator.generate()` — fully implemented end-to-end flow
+- 31 new render tests; total 521 passing
+
 ### Milestone 7 — Simulation Engine ✓ (v0.4.0 in PR)
 - `simulation/state.py`: `LeadSimState` — per-lead mutable state (stage, dwell, converted, churned, sql_day)
 - `simulation/engine.py`: `simulate_world()` — 90-day daily-step loop; `SimulationResult` output type
diff --git a/leadforge/api/bundle.py b/leadforge/api/bundle.py
new file mode 100644
index 0000000..2cfdb4c
--- /dev/null
+++ b/leadforge/api/bundle.py
@@ -0,0 +1,86 @@
+"""Bundle writer — assembles and serialises the full output bundle.
+
+:func:`write_bundle` is called by :meth:`WorldBundle.save` and orchestrates
+all rendering steps:
+
+1. Write relational Parquet tables (``tables/``).
+2. Build the lead snapshot and write task splits (``tasks/``).
+3. Write ``dataset_card.md`` and ``feature_dictionary.csv``.
+4. Build and write ``manifest.json``.
+"""
+
+from __future__ import annotations
+
+from pathlib import Path
+from typing import TYPE_CHECKING
+
+from leadforge.narrative.dataset_card import render_dataset_card
+from leadforge.render.manifests import build_manifest, write_manifest
+from leadforge.render.relational import to_dataframes
+from leadforge.render.snapshots import build_snapshot
+from leadforge.render.tasks import write_task_splits
+from leadforge.schema.dictionaries import write_feature_dictionary
+from leadforge.schema.tables import write_parquet
+from leadforge.schema.tasks import CONVERTED_WITHIN_90_DAYS
+
+if TYPE_CHECKING:
+    from leadforge.core.models import WorldBundle
+
+
+def write_bundle(bundle: WorldBundle, path: str | Path) -> None:
+    """Write *bundle* to disk at *path*.
+
+    Args:
+        bundle: Fully populated :class:`~leadforge.core.models.WorldBundle`.
+        path: Destination directory as ``str`` or ``Path`` (created if absent).
+
+    Raises:
+        RuntimeError: if any of ``bundle.simulation_result``,
+            ``bundle.population``, or ``bundle.world_graph`` are ``None``.
+    """
+    if bundle.simulation_result is None or bundle.population is None or bundle.world_graph is None:
+        raise RuntimeError("WorldBundle is not fully populated. Call Generator.generate() first.")
+
+    root = Path(path)
+    root.mkdir(parents=True, exist_ok=True)
+
+    config = bundle.spec.config
+    result = bundle.simulation_result
+    population = bundle.population
+    world_graph = bundle.world_graph
+
+    # ------------------------------------------------------------------
+    # 1. Relational tables → tables/
+    # ------------------------------------------------------------------
+    tables_dir = root / "tables"
+    tables_dir.mkdir(exist_ok=True)
+
+    dfs = to_dataframes(result, population)
+    table_row_counts: dict[str, int] = {}
+    for table_name, df in dfs.items():
+        write_parquet(df, tables_dir / f"{table_name}.parquet")
+        table_row_counts[table_name] = len(df)
+
+    # ------------------------------------------------------------------
+    # 2. Snapshot + task splits → tasks/
+    # ------------------------------------------------------------------
+    snapshot = build_snapshot(result, population, horizon_days=config.horizon_days)
+    task_row_counts = write_task_splits(snapshot, root / "tasks", seed=config.seed)
+
+    # ------------------------------------------------------------------
+    # 3. Dataset card (explicit UTF-8, not the locale default) and feature dictionary
+    # ------------------------------------------------------------------
+    (root / "dataset_card.md").write_text(render_dataset_card(bundle.spec), encoding="utf-8")
+    write_feature_dictionary(root / "feature_dictionary.csv")
+
+    # ------------------------------------------------------------------
+    # 4. Manifest (built last: it hashes the Parquet files written above)
+    # ------------------------------------------------------------------
+    manifest = build_manifest(
+        config=config,
+        world_graph=world_graph,
+        table_row_counts=table_row_counts,
+        task_row_counts={CONVERTED_WITHIN_90_DAYS.task_id: task_row_counts},
+        bundle_root=root,
+    )
+    write_manifest(manifest, root)
diff --git a/leadforge/api/generator.py b/leadforge/api/generator.py
index 0b1cfc8..39a719c 100644
--- a/leadforge/api/generator.py
+++ b/leadforge/api/generator.py
@@ -112,11 +112,67 @@ def generate(
         n_accounts: int | None = None,
         n_contacts: int | None = None,
         n_leads: int | None = None,
-        difficulty: str | DifficultyProfile = DifficultyProfile.intermediate,
+        difficulty: str | DifficultyProfile = _MISSING,  # type: ignore[assignment]
         **kwargs: Any,
     ) -> WorldBundle:
-        """Run the world simulation and return a bundle.
+        """Run the full world simulation and return an in-memory bundle.
+
+        Overrides in *n_accounts*, *n_contacts*, *n_leads*, and *difficulty*
+        take effect for this call only — they do not mutate the Generator.
+        When *difficulty* is omitted the Generator's configured difficulty is used.
+
+        Args:
+            n_accounts: Override account count.
+            n_contacts: Override contact count.
+            n_leads: Override lead count.
+            difficulty: Difficulty profile name or enum value.  Defaults to
+                the difficulty set on the Generator (i.e. from the recipe).
+            **kwargs: Reserved for future use.
 
-        Not yet implemented — available in v0.3.0+.
+        Returns:
+            A fully populated :class:`~leadforge.core.models.WorldBundle`.
+            Call :meth:`~leadforge.core.models.WorldBundle.save` to write it
+            to disk.
         """
-        raise NotImplementedError("Generator.generate() is not yet implemented. Coming in v0.3.0.")
+        import dataclasses
+
+        from leadforge.simulation.engine import simulate_world
+        from leadforge.simulation.population import build_population
+        from leadforge.structure.sampler import sample_hidden_graph
+
+        config = self._world_spec.config
+
+        # Apply per-call overrides without mutating the shared config.
+        overrides: dict[str, Any] = {}
+        if n_accounts is not None:
+            overrides["n_accounts"] = n_accounts
+        if n_contacts is not None:
+            overrides["n_contacts"] = n_contacts
+        if n_leads is not None:
+            overrides["n_leads"] = n_leads
+        if difficulty is not _MISSING:
+            if not isinstance(difficulty, DifficultyProfile):
+                difficulty = DifficultyProfile(difficulty)  # type: ignore[arg-type]
+            if difficulty != config.difficulty:
+                overrides["difficulty"] = difficulty
+        if overrides:
+            config = dataclasses.replace(config, **overrides)
+
+        narrative = self._world_spec.narrative
+        if narrative is None:
+            raise RuntimeError(
+                "No narrative loaded.  Initialise the Generator via "
+                "Generator.from_recipe() to resolve the narrative."
+            )
+
+        world_graph = sample_hidden_graph(config.seed)
+        population = build_population(config, narrative, world_graph)
+        result = simulate_world(config, population, world_graph)
+
+        spec = WorldSpec(config=config, narrative=narrative)
+        return WorldBundle(
+            spec=spec,
+            population=population,
+            simulation_result=result,
+            world_graph=world_graph,
+        )
diff --git a/leadforge/core/models.py b/leadforge/core/models.py
index 1aec86f..d4fe66b 100644
--- a/leadforge/core/models.py
+++ b/leadforge/core/models.py
@@ -11,6 +11,9 @@
 
 if TYPE_CHECKING:
     from leadforge.narrative.spec import NarrativeSpec
+    from leadforge.simulation.engine import SimulationResult
+    from leadforge.simulation.population import PopulationResult
+    from leadforge.structure.graph import WorldGraph
 
 
 def _require_positive_int(value: Any, name: str) -> None:
@@ -90,7 +93,44 @@ class WorldSpec:
 class WorldBundle:
     """In-memory result of one complete generation run.
 
-    Populated in Milestone 7+ (simulation and rendering).
+    Holds all generated artefacts and provides :meth:`save` to write the
+    full output bundle to disk.
+
+    Attributes:
+        spec: Fully resolved world specification (config + narrative).
+        population: Generated accounts, contacts, leads, and latent state.
+        simulation_result: Simulated event tables and final lead outcomes.
+        world_graph: Sampled hidden world graph used during simulation.
     """
 
     spec: WorldSpec = field(default_factory=WorldSpec)
+    population: PopulationResult | None = None
+    simulation_result: SimulationResult | None = None
+    world_graph: WorldGraph | None = None
+
+    def save(self, path: str) -> None:
+        """Persist this bundle as a directory tree rooted at *path*.
+
+        *path* is created when missing.  The files written follow the
+        canonical bundle layout described in ``CLAUDE.md``::
+
+            path/
+              manifest.json
+              dataset_card.md
+              feature_dictionary.csv
+              tables/          # one .parquet per relational table
+              tasks/converted_within_90_days/{train,valid,test}.parquet
+              tasks/converted_within_90_days/task_manifest.json
+
+        Args:
+            path: Directory to write into (created if absent).
+
+        Raises:
+            RuntimeError: when :attr:`population`, :attr:`simulation_result`,
+                or :attr:`world_graph` is still ``None`` — that is, the
+                bundle did not come from
+                :meth:`~leadforge.api.generator.Generator.generate`.
+        """
+        from leadforge.api.bundle import write_bundle as _write_bundle
+
+        _write_bundle(self, path)
diff --git a/leadforge/render/manifests.py b/leadforge/render/manifests.py
new file mode 100644
index 0000000..fa8dc31
--- /dev/null
+++ b/leadforge/render/manifests.py
@@ -0,0 +1,104 @@
+"""Bundle manifest builder.
+
+:func:`build_manifest` constructs the ``manifest.json`` dict that is written
+at the root of every output bundle.  The manifest records provenance (recipe,
+seed, version, generation timestamp) and integrity metadata (row counts and
+SHA-256 hashes) for the Parquet data files: relational tables and task splits.
+"""
+
+from __future__ import annotations
+
+import hashlib
+import json
+from datetime import UTC, datetime
+from pathlib import Path
+from typing import TYPE_CHECKING, Any
+
+if TYPE_CHECKING:
+    from leadforge.core.models import GenerationConfig
+    from leadforge.structure.graph import WorldGraph
+
+# Bump this whenever the bundle layout or manifest schema changes.
+BUNDLE_SCHEMA_VERSION = "1"
+
+
+def build_manifest(
+    config: GenerationConfig,
+    world_graph: WorldGraph,
+    table_row_counts: dict[str, int],
+    task_row_counts: dict[str, dict[str, int]],
+    bundle_root: Path,
+    generation_timestamp: str | None = None,
+) -> dict[str, Any]:
+    """Assemble the ``manifest.json`` payload for a bundle already on disk.
+
+    Digests are computed by re-reading each Parquet file under *bundle_root*,
+    so every table and task-split file must be on disk before this is called.
+
+    Args:
+        config: Resolved generation configuration (source of provenance fields).
+        world_graph: Sampled hidden world graph; only ``motif_family`` is read.
+        table_row_counts: Table name → number of rows written.
+        task_row_counts: Task id → {split name → number of rows written}.
+        bundle_root: Directory the bundle was written to.
+        generation_timestamp: ISO-8601 UTC timestamp; the current time when omitted.
+
+    Returns:
+        JSON-serialisable dict, ready for :func:`write_manifest`.
+    """
+    stamp = generation_timestamp
+    if stamp is None:
+        stamp = datetime.now(UTC).isoformat(timespec="seconds")
+
+    # One entry per relational table: row count, relative file path, digest.
+    table_entries: dict[str, Any] = {}
+    for name, n_rows in table_row_counts.items():
+        parquet_rel = f"tables/{name}.parquet"
+        table_entries[name] = {
+            "row_count": n_rows,
+            "file": parquet_rel,
+            "sha256": _sha256(bundle_root / parquet_rel),
+        }
+
+    # One flat entry per task, keyed ``<split>_rows`` / ``<split>_sha256``.
+    task_entries: dict[str, Any] = {}
+    for task_id, per_split in task_row_counts.items():
+        split_meta: dict[str, Any] = {}
+        for split, n_rows in per_split.items():
+            digest = _sha256(bundle_root / f"tasks/{task_id}/{split}.parquet")
+            split_meta[f"{split}_rows"] = n_rows
+            split_meta[f"{split}_sha256"] = digest
+        task_entries[task_id] = split_meta
+
+    return {
+        "bundle_schema_version": BUNDLE_SCHEMA_VERSION,
+        "package_version": config.package_version,
+        "recipe_id": config.recipe_id,
+        "seed": config.seed,
+        "generation_timestamp": stamp,
+        "exposure_mode": config.exposure_mode.value,
+        "difficulty": config.difficulty.value,
+        "n_accounts": config.n_accounts,
+        "n_contacts": config.n_contacts,
+        "n_leads": config.n_leads,
+        "horizon_days": config.horizon_days,
+        "motif_family": world_graph.motif_family,
+        "tables": table_entries,
+        "tasks": task_entries,
+    }
+
+
+def write_manifest(manifest: dict[str, Any], bundle_root: Path) -> Path:
+    """Write *manifest* as indented JSON to ``bundle_root/manifest.json``; return that path."""
+    target = bundle_root / "manifest.json"
+    target.write_text(json.dumps(manifest, indent=2))
+    return target
+
+
+def _sha256(path: Path) -> str:
+    """Stream the file at *path* through SHA-256 and return the hex digest."""
+    digest = hashlib.sha256()
+    with path.open("rb") as stream:
+        while block := stream.read(65536):
+            digest.update(block)
+    return digest.hexdigest()
diff --git a/leadforge/render/relational.py b/leadforge/render/relational.py
new file mode 100644
index 0000000..fb21578
--- /dev/null
+++ b/leadforge/render/relational.py
@@ -0,0 +1,84 @@
+"""Relational export — convert SimulationResult to typed DataFrames.
+
+:func:`to_dataframes` is the single entry point.  It produces one
+``pd.DataFrame`` per relational table, with dtypes matching the
+:attr:`~leadforge.schema.entities.AccountRow.DTYPE_MAP` of each entity
+class.  The resulting dict is consumed by the bundle writer to produce
+the ``tables/`` directory in the output bundle.
+"""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING, Literal, NamedTuple
+
+import pandas as pd
+
+from leadforge.schema.entities import (
+    AccountRow,
+    ContactRow,
+    CustomerRow,
+    EntityRowProtocol,
+    LeadRow,
+    OpportunityRow,
+    SalesActivityRow,
+    SessionRow,
+    SubscriptionRow,
+    TouchRow,
+)
+
+if TYPE_CHECKING:
+    from leadforge.simulation.engine import SimulationResult
+    from leadforge.simulation.population import PopulationResult
+
+_Source = Literal["population", "simulation"]
+
+
+class _TableSource(NamedTuple):
+    cls: type[EntityRowProtocol]  # row class; supplies DTYPE_MAP and empty_dataframe()
+    origin: _Source  # which result object holds the rows ("population" or "simulation")
+    attr: str  # name of the attribute on that object that holds the rows
+
+
+# Table name → source descriptor; iteration order is the order to_dataframes() emits tables.
+_TABLE_SOURCES: dict[str, _TableSource] = {
+    AccountRow.TABLE_NAME: _TableSource(AccountRow, "population", "accounts"),
+    ContactRow.TABLE_NAME: _TableSource(ContactRow, "population", "contacts"),
+    LeadRow.TABLE_NAME: _TableSource(LeadRow, "simulation", "leads"),
+    TouchRow.TABLE_NAME: _TableSource(TouchRow, "simulation", "touches"),
+    SessionRow.TABLE_NAME: _TableSource(SessionRow, "simulation", "sessions"),
+    SalesActivityRow.TABLE_NAME: _TableSource(SalesActivityRow, "simulation", "sales_activities"),
+    OpportunityRow.TABLE_NAME: _TableSource(OpportunityRow, "simulation", "opportunities"),
+    CustomerRow.TABLE_NAME: _TableSource(CustomerRow, "simulation", "customers"),
+    SubscriptionRow.TABLE_NAME: _TableSource(SubscriptionRow, "simulation", "subscriptions"),
+}
+
+
+def to_dataframes(
+    result: SimulationResult,
+    population: PopulationResult,
+) -> dict[str, pd.DataFrame]:
+    """Render every relational table as a typed ``pd.DataFrame``.
+
+    Args:
+        result: Simulation output; holds the row lists that ``_TABLE_SOURCES``
+            marks as ``"simulation"``.
+        population: Population output; holds the account and contact row lists.
+
+    Returns:
+        Table name → DataFrame.  Columns listed in the row class's ``DTYPE_MAP``
+        are cast to the mapped dtype; a table with no rows is produced by the
+        row class's ``empty_dataframe()`` instead.
+    """
+    frames: dict[str, pd.DataFrame] = {}
+    for name, (row_cls, origin, attr) in _TABLE_SOURCES.items():
+        holder = result if origin != "population" else population
+        # getattr without a default: a missing attribute raises AttributeError at once.
+        records = getattr(holder, attr)
+        if not records:
+            frames[name] = row_cls.empty_dataframe()
+            continue
+        frame = pd.DataFrame([rec.to_dict() for rec in records])
+        # Cast only the columns that are actually present in the frame.
+        casts = {col: dtype for col, dtype in row_cls.DTYPE_MAP.items() if col in frame.columns}
+        frames[name] = frame.astype(casts)
+    return frames
diff --git a/leadforge/render/snapshots.py b/leadforge/render/snapshots.py
new file mode 100644
index 0000000..f43fbd6
--- /dev/null
+++ b/leadforge/render/snapshots.py
@@ -0,0 +1,186 @@
+"""Lead snapshot builder — flatten the simulated world into an ML-ready table.
+
+:func:`build_snapshot` produces one row per lead, containing the features
+defined in :data:`~leadforge.schema.features.LEAD_SNAPSHOT_FEATURES`.  All
+columns are anchored at or before the snapshot date (lead creation + horizon),
+preserving the leakage-free guarantee.
+
+The snapshot is the source table for the primary task export
+(``converted_within_90_days``).
+"""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import pandas as pd
+
+from leadforge.schema.entities import (
+    OpportunityRow,
+    SalesActivityRow,
+    SessionRow,
+    TouchRow,
+)
+from leadforge.schema.features import LEAD_SNAPSHOT_FEATURES
+
+if TYPE_CHECKING:
+    from leadforge.simulation.engine import SimulationResult
+    from leadforge.simulation.population import PopulationResult
+
+# Ordered column list and dtypes derived from the canonical feature spec.
+_SNAPSHOT_COLUMNS = [f.name for f in LEAD_SNAPSHOT_FEATURES]
+_SNAPSHOT_DTYPES = {f.name: f.dtype for f in LEAD_SNAPSHOT_FEATURES}
+
+# Join columns derived from the feature spec — single source of truth.
+# Adding a new account/contact feature to LEAD_SNAPSHOT_FEATURES automatically
+# includes it here without any manual list maintenance.
+_ACCOUNT_JOIN_COLS = [f.name for f in LEAD_SNAPSHOT_FEATURES if f.category == "account"]
+_CONTACT_JOIN_COLS = [f.name for f in LEAD_SNAPSHOT_FEATURES if f.category == "contact"]
+
+# Aggregated count columns that need zero-filling after left-merge.
+_INT_AGG_COLS = [
+    "touch_count",
+    "inbound_touch_count",
+    "outbound_touch_count",
+    "session_count",
+    "pricing_page_views",
+    "demo_page_views",
+    "total_session_duration_seconds",
+    "activity_count",
+]
+
+
+def build_snapshot(
+    result: SimulationResult,
+    population: PopulationResult,
+    horizon_days: int = 90,
+) -> pd.DataFrame:
+    """Build the lead snapshot DataFrame from simulation output.
+
+    One row is produced per lead.  Features are computed by aggregating
+    touches, sessions, and sales activities that occurred during the
+    simulation horizon.  The snapshot anchor date is
+    ``lead_created_at + timedelta(days=horizon_days)``.
+
+    Args:
+        result: Output of :func:`~leadforge.simulation.engine.simulate_world`.
+        population: Output of
+            :func:`~leadforge.simulation.population.build_population`.
+        horizon_days: Simulation horizon length.  Defaults to 90.
+
+    Returns:
+        A ``pd.DataFrame`` with the columns specified in
+        :data:`~leadforge.schema.features.LEAD_SNAPSHOT_FEATURES` and dtypes
+        matching the feature spec.  Row order matches ``result.leads``.
+    """
+    # -------------------------------------------------------------------
+    # Aggregate events by lead_id; empty lists use the entity's empty DataFrame
+    # so groupby keeps its column names.  NOTE(review): no event is filtered
+    # against anchor_date here — assumes none fall past the horizon; confirm.
+    # -------------------------------------------------------------------
+
+    # Touch aggregates
+    td = (
+        pd.DataFrame([t.to_dict() for t in result.touches])
+        if result.touches
+        else TouchRow.empty_dataframe()
+    )
+    touch_agg = (
+        td.groupby("lead_id")
+        .agg(
+            touch_count=("touch_id", "count"),
+            inbound_touch_count=(
+                "touch_direction",
+                lambda s: int((s == "inbound").sum()),
+            ),
+            outbound_touch_count=(
+                "touch_direction",
+                lambda s: int((s == "outbound").sum()),
+            ),
+            last_touch_timestamp=("touch_timestamp", "max"),
+        )
+        .reset_index()
+    )
+
+    # Session aggregates
+    sd = (
+        pd.DataFrame([s.to_dict() for s in result.sessions])
+        if result.sessions
+        else SessionRow.empty_dataframe()
+    )
+    sess_agg = (
+        sd.groupby("lead_id")
+        .agg(
+            session_count=("session_id", "count"),
+            pricing_page_views=("pricing_page_views", "sum"),
+            demo_page_views=("demo_page_views", "sum"),
+            total_session_duration_seconds=("session_duration_seconds", "sum"),
+        )
+        .reset_index()
+    )
+
+    # Sales activity aggregates
+    ad = (
+        pd.DataFrame([a.to_dict() for a in result.sales_activities])
+        if result.sales_activities
+        else SalesActivityRow.empty_dataframe()
+    )
+    act_agg = ad.groupby("lead_id").agg(activity_count=("activity_id", "count")).reset_index()
+
+    # Opportunity join: open = close_outcome is null; first non-null estimated_acv per lead.
+    od = (
+        pd.DataFrame([o.to_dict() for o in result.opportunities])
+        if result.opportunities
+        else OpportunityRow.empty_dataframe()
+    )
+    open_opps = od[od["close_outcome"].isna()][["lead_id", "estimated_acv"]]
+    open_opps = open_opps.groupby("lead_id").first().reset_index()
+    open_opps = open_opps.rename(columns={"estimated_acv": "opportunity_estimated_acv"})
+    open_opps["has_open_opportunity"] = True
+
+    # -------------------------------------------------------------------
+    # Build base lead DataFrame and join aggregates.
+    # -------------------------------------------------------------------
+    lead_df = pd.DataFrame([lead.to_dict() for lead in result.leads])
+
+    # Compute snapshot anchor date (per lead, vectorised).
+    lead_df["anchor_date"] = pd.to_datetime(lead_df["lead_created_at"]) + pd.Timedelta(
+        days=horizon_days
+    )
+
+    # Join aggregates (left join preserves all leads).
+    lead_df = lead_df.merge(touch_agg, on="lead_id", how="left")
+    lead_df = lead_df.merge(sess_agg, on="lead_id", how="left")
+    lead_df = lead_df.merge(act_agg, on="lead_id", how="left")
+    lead_df = lead_df.merge(open_opps, on="lead_id", how="left")
+
+    # Fill missing event aggregate counts with zero; has_open_opportunity with False.
+    # opportunity_estimated_acv and days_since_last_touch intentionally stay NaN.
+    lead_df[_INT_AGG_COLS] = lead_df[_INT_AGG_COLS].fillna(0)
+    opp_mask = lead_df["has_open_opportunity"].notna()
+    lead_df["has_open_opportunity"] = lead_df["has_open_opportunity"].where(opp_mask, other=False)
+
+    # Compute days_since_last_touch fully vectorised: leads with no touches have
+    # a null last_touch_timestamp -> NaT -> NaT difference -> NaN from .dt.days.
+    last_ts = pd.to_datetime(lead_df["last_touch_timestamp"])
+    lead_df["days_since_last_touch"] = (lead_df["anchor_date"] - last_ts).dt.days
+
+    # -------------------------------------------------------------------
+    # Join account and contact features via vectorised merge (not apply).
+    # Columns are derived from LEAD_SNAPSHOT_FEATURES categories so this
+    # list stays in sync automatically when the feature spec changes.
+    # -------------------------------------------------------------------
+    acct_df = pd.DataFrame([a.to_dict() for a in population.accounts])[_ACCOUNT_JOIN_COLS]
+    cont_df = pd.DataFrame([c.to_dict() for c in population.contacts])[_CONTACT_JOIN_COLS]
+    lead_df = lead_df.merge(acct_df, on="account_id", how="left")
+    lead_df = lead_df.merge(cont_df, on="contact_id", how="left")
+
+    # -------------------------------------------------------------------
+    # Select, order, and cast columns — single authoritative dtype pass.
+    # -------------------------------------------------------------------
+    snapshot = lead_df[_SNAPSHOT_COLUMNS].copy()
+    for col, dtype in _SNAPSHOT_DTYPES.items():
+        if col in snapshot.columns:
+            snapshot[col] = snapshot[col].astype(dtype)
+
+    return snapshot
diff --git a/leadforge/render/tasks.py b/leadforge/render/tasks.py
new file mode 100644
index 0000000..7d6013c
--- /dev/null
+++ b/leadforge/render/tasks.py
@@ -0,0 +1,77 @@
+"""Task export — deterministic train/valid/test split and Parquet output.
+
+:func:`write_task_splits` takes the lead snapshot DataFrame, shuffles it
+deterministically, splits it according to the task manifest ratios, and
+writes the three Parquet files plus a ``task_manifest.json`` into the
+tasks directory.
+"""
+
+from __future__ import annotations
+
+import json
+from pathlib import Path
+
+import pandas as pd
+
+from leadforge.core.rng import RNGRoot
+from leadforge.schema.tasks import CONVERTED_WITHIN_90_DAYS, TaskManifest
+
+
+def write_task_splits(
+    snapshot: pd.DataFrame,
+    out_dir: Path,
+    *,
+    seed: int,
+    task: TaskManifest = CONVERTED_WITHIN_90_DAYS,
+) -> dict[str, int]:
+    """Write seeded train/valid/test Parquet splits of *snapshot* for *task*.
+
+    Output lands in ``out_dir / task.task_id /``::
+
+        train.parquet
+        valid.parquet
+        test.parquet
+        task_manifest.json
+
+    Args:
+        snapshot: Lead snapshot DataFrame, as returned by
+            :func:`~leadforge.render.snapshots.build_snapshot`.
+        out_dir: Directory under which the per-task folder is created
+            (typically ``bundle_root / "tasks"``).
+        seed: Seed for the deterministic row shuffle.
+        task: Task manifest supplying ``task_id`` and the split ratios.
+
+    Returns:
+        Row counts keyed by split name, in the order ``"train"``,
+        ``"valid"``, ``"test"``.
+    """
+    dest = out_dir / task.task_id
+    dest.mkdir(parents=True, exist_ok=True)
+
+    # Permute row positions with the project's named RNG substream.
+    order = list(range(len(snapshot)))
+    RNGRoot(seed).child("task_split_shuffle").shuffle(order)
+    permuted = snapshot.iloc[order].reset_index(drop=True)
+
+    # Train and valid sizes are truncated products; test takes whatever is
+    # left, so the three splits always cover every row exactly once.
+    total = len(permuted)
+    train_end = int(total * task.split.train)
+    valid_end = train_end + int(total * task.split.valid)
+    bounds = {
+        "train": slice(None, train_end),
+        "valid": slice(train_end, valid_end),
+        "test": slice(valid_end, None),
+    }
+
+    # Write each split and record how many rows it holds.
+    written: dict[str, int] = {}
+    for split_name, rows in bounds.items():
+        part = permuted.iloc[rows]
+        part.to_parquet(dest / f"{split_name}.parquet", index=False, engine="pyarrow")
+        written[split_name] = len(part)
+
+    # The task description is stored next to the Parquet files it describes.
+    (dest / "task_manifest.json").write_text(json.dumps(task.to_dict(), indent=2))
+
+    return written
diff --git a/leadforge/schema/entities.py b/leadforge/schema/entities.py
index 2a60a7c..d97230a 100644
--- a/leadforge/schema/entities.py
+++ b/leadforge/schema/entities.py
@@ -18,11 +18,26 @@
 from __future__ import annotations
 
 from dataclasses import dataclass, fields
-from typing import Any, ClassVar
+from typing import Any, ClassVar, Protocol
 
 import pandas as pd
 
 
+class EntityRowProtocol(Protocol):
+    """Structural protocol shared by all entity row dataclasses.
+
+    Allows typed dispatch in render code without coupling to concrete classes.
+    """
+
+    TABLE_NAME: ClassVar[str]  # relational table name (collected into TABLE_NAMES below)
+    DTYPE_MAP: ClassVar[dict[str, str]]  # column name -> pandas dtype string
+
+    def to_dict(self) -> dict[str, Any]: ...  # one row as a column -> value mapping
+
+    @classmethod
+    def empty_dataframe(cls) -> pd.DataFrame: ...  # zero-row frame for this table
+
+
 def _empty_df(dtype_map: dict[str, str]) -> pd.DataFrame:
     """Return a zero-row DataFrame with columns ordered as *dtype_map*."""
     return pd.DataFrame({col: pd.array([], dtype=dtype) for col, dtype in dtype_map.items()})
@@ -360,7 +375,7 @@ def empty_dataframe(cls) -> pd.DataFrame:
 # Registry
 # ---------------------------------------------------------------------------
 
-ALL_ROW_TYPES: tuple[type, ...] = (
+ALL_ROW_TYPES: tuple[type[EntityRowProtocol], ...] = (
     AccountRow,
     ContactRow,
     LeadRow,
@@ -372,4 +387,4 @@ def empty_dataframe(cls) -> pd.DataFrame:
     SubscriptionRow,
 )
 
-TABLE_NAMES: tuple[str, ...] = tuple(cls.TABLE_NAME for cls in ALL_ROW_TYPES)  # type: ignore[attr-defined]
+TABLE_NAMES: tuple[str, ...] = tuple(cls.TABLE_NAME for cls in ALL_ROW_TYPES)
diff --git a/tests/api/test_generator.py b/tests/api/test_generator.py
index b7c2b1b..05e896e 100644
--- a/tests/api/test_generator.py
+++ b/tests/api/test_generator.py
@@ -60,10 +60,35 @@ def test_from_recipe_invalid_id_raises() -> None:
         Generator.from_recipe("does_not_exist")
 
 
-def test_generate_not_implemented() -> None:
-    gen = Generator.from_recipe("b2b_saas_procurement_v1")
-    with pytest.raises(NotImplementedError):
-        gen.generate()
+def test_generate_returns_world_bundle() -> None:  # generate() returns a populated WorldBundle
+    from leadforge.core.models import WorldBundle
+
+    gen = Generator.from_recipe("b2b_saas_procurement_v1", seed=42)
+    bundle = gen.generate(n_leads=30, n_accounts=15, n_contacts=45)
+    assert isinstance(bundle, WorldBundle)
+    assert bundle.simulation_result is not None  # generate() must populate the simulation output
+    assert bundle.population is not None  # ...and the population
+
+
+def test_generate_respects_recipe_difficulty_when_not_overridden() -> None:
+    """generate() without a difficulty kwarg must keep the difficulty set at from_recipe() time."""
+    from leadforge.core.enums import DifficultyProfile
+
+    gen = Generator.from_recipe("b2b_saas_procurement_v1", difficulty="advanced")
+    assert gen.config.difficulty == DifficultyProfile.advanced  # precondition: string coerced
+    bundle = gen.generate(n_leads=20, n_accounts=10, n_contacts=30)
+    assert bundle.spec.config.difficulty == DifficultyProfile.advanced  # carried into the bundle
+
+
+def test_generate_explicit_difficulty_overrides_recipe() -> None:
+    """An explicit difficulty kwarg to generate() wins over from_recipe()'s, for that call only."""
+    from leadforge.core.enums import DifficultyProfile
+
+    gen = Generator.from_recipe("b2b_saas_procurement_v1", difficulty="advanced")
+    bundle = gen.generate(n_leads=20, n_accounts=10, n_contacts=30, difficulty="intro")
+    assert bundle.spec.config.difficulty == DifficultyProfile.intro
+    # The override is per-call: the generator's own config must not be mutated.
+    assert gen.config.difficulty == DifficultyProfile.advanced
 
 
 def test_from_recipe_config_has_package_version() -> None:
diff --git a/tests/render/__init__.py b/tests/render/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/tests/render/test_render.py b/tests/render/test_render.py
new file mode 100644
index 0000000..18df3cd
--- /dev/null
+++ b/tests/render/test_render.py
@@ -0,0 +1,475 @@
+"""Tests for the render layer: relational.py, snapshots.py, tasks.py, manifests.py."""
+
+from __future__ import annotations
+
+import json
+
+import pandas as pd
+import pytest
+
+from leadforge.core.models import GenerationConfig
+from leadforge.schema.features import LEAD_SNAPSHOT_FEATURES
+from leadforge.simulation.engine import simulate_world
+from leadforge.simulation.population import build_population
+from leadforge.structure.sampler import sample_hidden_graph
+
+# ---------------------------------------------------------------------------
+# Shared fixtures
+# ---------------------------------------------------------------------------
+
+_SNAPSHOT_COLUMNS = [f.name for f in LEAD_SNAPSHOT_FEATURES]
+_SNAPSHOT_DTYPES = {f.name: f.dtype for f in LEAD_SNAPSHOT_FEATURES}
+
+
+def _make_config(seed: int = 42, n_leads: int = 80) -> GenerationConfig:  # small test world
+    return GenerationConfig(seed=seed, n_accounts=30, n_contacts=90, n_leads=n_leads)
+
+
+def _make_narrative(seed: int = 42):  # narrative of the b2b_saas_procurement_v1 world spec
+    from leadforge.api.generator import Generator
+
+    gen = Generator.from_recipe("b2b_saas_procurement_v1", seed=seed)
+    assert gen.world_spec.narrative is not None  # fail fast if the recipe yields no narrative
+    return gen.world_spec.narrative
+
+
+@pytest.fixture(scope="module")
+def sim_outputs():
+    """Run one small simulation per module; return (config, population, result, graph)."""
+    config = _make_config()
+    narrative = _make_narrative(config.seed)
+    graph = sample_hidden_graph(config.seed)  # same seed as config/narrative, not a literal 42
+    population = build_population(config, narrative, graph)
+    result = simulate_world(config, population, graph)
+    return config, population, result, graph
+
+
+# ---------------------------------------------------------------------------
+# render/relational.py
+# ---------------------------------------------------------------------------
+
+
+class TestToDataframes:  # to_dataframes(result, population) -> {table name: DataFrame}
+    def test_returns_all_table_names(self, sim_outputs):
+        _, population, result, _ = sim_outputs
+        from leadforge.render.relational import to_dataframes
+
+        dfs = to_dataframes(result, population)
+        expected = {
+            "accounts",
+            "contacts",
+            "leads",
+            "touches",
+            "sessions",
+            "sales_activities",
+            "opportunities",
+            "customers",
+            "subscriptions",
+        }
+        assert set(dfs.keys()) == expected  # exact match: no missing and no extra tables
+
+    def test_lead_count_matches(self, sim_outputs):
+        config, population, result, _ = sim_outputs
+        from leadforge.render.relational import to_dataframes
+
+        dfs = to_dataframes(result, population)
+        assert len(dfs["leads"]) == config.n_leads  # one row per configured lead
+
+    def test_account_and_contact_counts(self, sim_outputs):
+        config, population, result, _ = sim_outputs
+        from leadforge.render.relational import to_dataframes
+
+        dfs = to_dataframes(result, population)
+        assert len(dfs["accounts"]) == config.n_accounts
+        assert len(dfs["contacts"]) == config.n_contacts
+
+    def test_dataframes_are_dataframes(self, sim_outputs):
+        _, population, result, _ = sim_outputs
+        from leadforge.render.relational import to_dataframes
+
+        dfs = to_dataframes(result, population)
+        for name, df in dfs.items():
+            assert isinstance(df, pd.DataFrame), f"{name} is not a DataFrame"
+
+    def test_empty_tables_have_schema(self, sim_outputs):
+        """The customers table must expose every CustomerRow.DTYPE_MAP column, even with no rows."""
+        _, population, result, _ = sim_outputs
+        from leadforge.render.relational import to_dataframes
+        from leadforge.schema.entities import CustomerRow
+
+        dfs = to_dataframes(result, population)  # NOTE(review): customers need not be empty here
+        assert set(CustomerRow.DTYPE_MAP.keys()).issubset(set(dfs["customers"].columns))
+
+    def test_fk_integrity(self, sim_outputs):
+        """Every constraint in ALL_CONSTRAINTS must validate against the produced DataFrames."""
+        _, population, result, _ = sim_outputs
+        from leadforge.render.relational import to_dataframes
+        from leadforge.schema.relationships import ALL_CONSTRAINTS, validate_fk
+
+        dfs = to_dataframes(result, population)
+        for constraint in ALL_CONSTRAINTS:
+            child_df = dfs.get(constraint.child_table)
+            parent_df = dfs.get(constraint.parent_table)
+            if child_df is None or parent_df is None or child_df.empty:
+                continue  # nothing to check for absent or empty tables
+            validate_fk(
+                child_values=child_df[constraint.child_column].dropna().tolist(),  # skip nulls
+                parent_values=set(parent_df[constraint.parent_column].tolist()),
+                constraint=constraint,
+            )
+
+    def test_deterministic_under_same_seed(self):
+        """Two full runs with the same seed must yield identical relational DataFrames."""
+        from leadforge.render.relational import to_dataframes
+
+        def _run(seed):  # full pipeline from a single seed: config, narrative, graph, simulation
+            cfg = _make_config(seed=seed)
+            narr = _make_narrative(seed)
+            g = sample_hidden_graph(seed)
+            pop = build_population(cfg, narr, g)
+            res = simulate_world(cfg, pop, g)
+            return to_dataframes(res, pop)
+
+        dfs1 = _run(77)
+        dfs2 = _run(77)
+        for tbl in ("leads", "accounts", "touches"):  # only these three tables are compared
+            pd.testing.assert_frame_equal(dfs1[tbl], dfs2[tbl], check_like=False)
+
+
+# ---------------------------------------------------------------------------
+# render/snapshots.py
+# ---------------------------------------------------------------------------
+
+
+class TestBuildSnapshot:  # build_snapshot(result, population[, horizon_days]) -> DataFrame
+    def test_row_count_equals_lead_count(self, sim_outputs):
+        config, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+
+        snap = build_snapshot(result, population, horizon_days=config.horizon_days)
+        assert len(snap) == config.n_leads  # exactly one snapshot row per lead
+
+    def test_all_snapshot_columns_present(self, sim_outputs):
+        _, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+
+        snap = build_snapshot(result, population)
+        for col in _SNAPSHOT_COLUMNS:  # names taken from LEAD_SNAPSHOT_FEATURES
+            assert col in snap.columns, f"Missing column: {col}"
+
+    def test_no_extra_columns(self, sim_outputs):
+        _, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+
+        snap = build_snapshot(result, population)
+        assert set(snap.columns) == set(_SNAPSHOT_COLUMNS)  # set equality: order not checked
+
+    def test_target_column_is_boolean(self, sim_outputs):
+        _, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+
+        snap = build_snapshot(result, population)
+        assert snap["converted_within_90_days"].dtype.name == "boolean"  # nullable BooleanDtype
+
+    def test_touch_counts_non_negative(self, sim_outputs):
+        _, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+
+        snap = build_snapshot(result, population)
+        assert (snap["touch_count"].dropna() >= 0).all()  # missing counts are ignored
+        assert (snap["inbound_touch_count"].dropna() >= 0).all()
+        assert (snap["outbound_touch_count"].dropna() >= 0).all()
+
+    def test_inbound_plus_outbound_equals_total(self, sim_outputs):
+        """inbound + outbound must equal touch_count exactly (only two directions in v1)."""
+        _, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+
+        snap = build_snapshot(result, population)
+        valid = snap[["touch_count", "inbound_touch_count", "outbound_touch_count"]].dropna()
+        combined = valid["inbound_touch_count"] + valid["outbound_touch_count"]
+        assert (combined == valid["touch_count"]).all()  # checked only on fully non-null rows
+
+    def test_days_since_last_touch_finite_when_touches_exist(self, sim_outputs):
+        _, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+
+        snap = build_snapshot(result, population)
+        has_touch = snap["touch_count"] > 0
+        if has_touch.any():  # passes vacuously when no lead has a touch
+            assert snap.loc[has_touch, "days_since_last_touch"].notna().all()
+
+    def test_no_post_anchor_columns_in_snapshot(self, sim_outputs):
+        """Columns that represent post-anchor truth must not appear in the snapshot."""
+        _, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+
+        snap = build_snapshot(result, population)
+        # These exist in LeadRow / OpportunityRow but must be excluded (leakage rule).
+        forbidden = {"conversion_timestamp", "closed_at", "close_outcome"}
+        assert forbidden.isdisjoint(set(snap.columns))
+
+    def test_target_matches_simulation_result(self, sim_outputs):
+        """Each lead's converted_within_90_days in the snapshot must equal the flag on result.leads."""
+        _, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+
+        snap = build_snapshot(result, population)
+        lead_flags = {row.lead_id: row.converted_within_90_days for row in result.leads}
+        snap_flags = dict(zip(snap["lead_id"], snap["converted_within_90_days"], strict=False))
+        for lid, flag in lead_flags.items():  # a lead missing from the snapshot raises KeyError
+            assert snap_flags[lid] == flag, f"Mismatch on {lid}"
+
+    def test_deterministic_under_same_seed(self):
+        """Two full runs with the same seed must yield identical snapshots."""
+        from leadforge.render.snapshots import build_snapshot
+
+        def _snap(seed):  # full pipeline from a single seed, ending in the snapshot
+            cfg = _make_config(seed=seed)
+            narr = _make_narrative(seed)
+            g = sample_hidden_graph(seed)
+            pop = build_population(cfg, narr, g)
+            res = simulate_world(cfg, pop, g)
+            return build_snapshot(res, pop, horizon_days=cfg.horizon_days)
+
+        s1 = _snap(13)
+        s2 = _snap(13)
+        pd.testing.assert_frame_equal(s1, s2, check_like=False)  # order-sensitive comparison
+
+
+# ---------------------------------------------------------------------------
+# render/tasks.py
+# ---------------------------------------------------------------------------
+
+
+class TestWriteTaskSplits:  # write_task_splits(snapshot, out_dir, seed=...) -> row counts per split
+    def test_three_files_written(self, sim_outputs, tmp_path):
+        config, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+        from leadforge.render.tasks import write_task_splits
+
+        snap = build_snapshot(result, population, horizon_days=config.horizon_days)
+        write_task_splits(snap, tmp_path, seed=config.seed)
+
+        task_dir = tmp_path / "converted_within_90_days"  # files land in a per-task subdirectory
+        for split in ("train", "valid", "test"):
+            assert (task_dir / f"{split}.parquet").exists(), f"{split}.parquet missing"
+
+    def test_task_manifest_written(self, sim_outputs, tmp_path):
+        config, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+        from leadforge.render.tasks import write_task_splits
+
+        snap = build_snapshot(result, population, horizon_days=config.horizon_days)
+        write_task_splits(snap, tmp_path, seed=config.seed)
+
+        manifest_path = tmp_path / "converted_within_90_days" / "task_manifest.json"
+        assert manifest_path.exists()
+        data = json.loads(manifest_path.read_text())  # must parse as JSON
+        assert "task_id" in data
+
+    def test_row_counts_sum_to_total(self, sim_outputs, tmp_path):
+        config, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+        from leadforge.render.tasks import write_task_splits
+
+        snap = build_snapshot(result, population, horizon_days=config.horizon_days)
+        counts = write_task_splits(snap, tmp_path, seed=config.seed)
+
+        assert counts["train"] + counts["valid"] + counts["test"] == len(snap)  # no row dropped
+
+    def test_split_ratios_approx(self, sim_outputs, tmp_path):
+        """Train ~ 0.70, valid ~ 0.15, test ~ 0.15 of the rows, each within +/-0.05 absolute."""
+        config, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+        from leadforge.render.tasks import write_task_splits
+
+        snap = build_snapshot(result, population, horizon_days=config.horizon_days)
+        counts = write_task_splits(snap, tmp_path, seed=config.seed)
+        n = len(snap)
+        assert counts["train"] / n == pytest.approx(0.70, abs=0.05)
+        assert counts["valid"] / n == pytest.approx(0.15, abs=0.05)
+        assert counts["test"] / n == pytest.approx(0.15, abs=0.05)
+
+    def test_splits_are_disjoint(self, sim_outputs, tmp_path):
+        config, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+        from leadforge.render.tasks import write_task_splits
+
+        snap = build_snapshot(result, population, horizon_days=config.horizon_days)
+        write_task_splits(snap, tmp_path, seed=config.seed)
+
+        task_dir = tmp_path / "converted_within_90_days"
+        dfs = {s: pd.read_parquet(task_dir / f"{s}.parquet") for s in ("train", "valid", "test")}
+        ids = {s: set(dfs[s]["lead_id"]) for s in dfs}  # lead_id sets read back from disk
+        assert ids["train"].isdisjoint(ids["valid"])
+        assert ids["train"].isdisjoint(ids["test"])
+        assert ids["valid"].isdisjoint(ids["test"])
+
+    def test_deterministic_under_same_seed(self, sim_outputs, tmp_path):
+        config, population, result, _ = sim_outputs
+        from leadforge.render.snapshots import build_snapshot
+        from leadforge.render.tasks import write_task_splits
+
+        snap = build_snapshot(result, population, horizon_days=config.horizon_days)
+
+        p1 = tmp_path / "run1"  # same snapshot and seed, two separate output roots
+        p2 = tmp_path / "run2"
+        c1 = write_task_splits(snap, p1, seed=config.seed)
+        c2 = write_task_splits(snap, p2, seed=config.seed)
+        assert c1 == c2
+
+        task_id = "converted_within_90_days"
+        for split in ("train", "valid", "test"):
+            df1 = pd.read_parquet(p1 / task_id / f"{split}.parquet")
+            df2 = pd.read_parquet(p2 / task_id / f"{split}.parquet")
+            pd.testing.assert_frame_equal(df1, df2)  # same rows in the same order
+
+
+# ---------------------------------------------------------------------------
+# render/manifests.py
+# ---------------------------------------------------------------------------
+
+
+class TestBuildManifest:  # build_manifest(...) returns a JSON-serialisable dict
+    def _make_manifest(self, sim_outputs, tmp_path):  # write tables + splits, then build manifest
+        config, population, result, world_graph = sim_outputs
+        from leadforge.render.manifests import build_manifest
+        from leadforge.render.relational import to_dataframes
+        from leadforge.render.snapshots import build_snapshot
+        from leadforge.render.tasks import write_task_splits
+        from leadforge.schema.tables import write_parquet
+
+        tables_dir = tmp_path / "tables"
+        tables_dir.mkdir()
+        dfs = to_dataframes(result, population)
+        table_row_counts = {}
+        for name, df in dfs.items():  # one <table>.parquet per relational table
+            write_parquet(df, tables_dir / f"{name}.parquet")
+            table_row_counts[name] = len(df)
+
+        snap = build_snapshot(result, population, horizon_days=config.horizon_days)
+        task_counts = write_task_splits(snap, tmp_path / "tasks", seed=config.seed)
+
+        manifest = build_manifest(
+            config=config,
+            world_graph=world_graph,
+            table_row_counts=table_row_counts,
+            task_row_counts={"converted_within_90_days": task_counts},  # keyed by task id
+            bundle_root=tmp_path,
+        )
+        return manifest
+
+    def test_required_top_level_keys(self, sim_outputs, tmp_path):
+        manifest = self._make_manifest(sim_outputs, tmp_path)
+        required = {
+            "bundle_schema_version",
+            "package_version",
+            "recipe_id",
+            "seed",
+            "generation_timestamp",
+            "exposure_mode",
+            "difficulty",
+            "n_accounts",
+            "n_contacts",
+            "n_leads",
+            "horizon_days",
+            "motif_family",
+            "tables",
+            "tasks",
+        }
+        assert required.issubset(set(manifest.keys()))  # extra keys are allowed
+
+    def test_table_row_counts_match(self, sim_outputs, tmp_path):
+        config, _, _, _ = sim_outputs
+        manifest = self._make_manifest(sim_outputs, tmp_path)
+        assert manifest["tables"]["leads"]["row_count"] == config.n_leads
+        assert manifest["tables"]["accounts"]["row_count"] == config.n_accounts
+        assert manifest["tables"]["contacts"]["row_count"] == config.n_contacts
+
+    def test_sha256_populated(self, sim_outputs, tmp_path):
+        manifest = self._make_manifest(sim_outputs, tmp_path)
+        for tbl, entry in manifest["tables"].items():  # 64 = SHA-256 hex digest length
+            assert isinstance(entry["sha256"], str), f"{tbl} sha256 is not a string"
+            assert len(entry["sha256"]) == 64, f"{tbl} sha256 has wrong length"
+
+    def test_task_split_counts_present(self, sim_outputs, tmp_path):
+        manifest = self._make_manifest(sim_outputs, tmp_path)
+        task = manifest["tasks"]["converted_within_90_days"]
+        assert "train_rows" in task  # presence only; the values are not checked here
+        assert "valid_rows" in task
+        assert "test_rows" in task
+
+    def test_seed_and_recipe_recorded(self, sim_outputs, tmp_path):
+        config, _, _, _ = sim_outputs
+        manifest = self._make_manifest(sim_outputs, tmp_path)
+        assert manifest["seed"] == config.seed
+        assert manifest["recipe_id"] == config.recipe_id
+
+    def test_manifest_is_json_serialisable(self, sim_outputs, tmp_path):
+        manifest = self._make_manifest(sim_outputs, tmp_path)
+        dumped = json.dumps(manifest)  # raises TypeError on any non-JSON value
+        reloaded = json.loads(dumped)
+        assert reloaded["seed"] == manifest["seed"]
+
+
+# ---------------------------------------------------------------------------
+# api/bundle.py — integration smoke test
+# ---------------------------------------------------------------------------
+
+
+class TestWriteBundle:  # write_bundle(bundle, path) and WorldBundle.save(path) smoke tests
+    def test_full_bundle_written(self, sim_outputs, tmp_path):
+        config, population, result, world_graph = sim_outputs
+        from leadforge.api.bundle import write_bundle
+        from leadforge.core.models import WorldBundle, WorldSpec
+
+        bundle = WorldBundle(
+            spec=WorldSpec(config=config),
+            population=population,
+            simulation_result=result,
+            world_graph=world_graph,
+        )
+        write_bundle(bundle, str(tmp_path))  # path is passed as str, not Path
+
+        assert (tmp_path / "manifest.json").exists()
+        assert (tmp_path / "dataset_card.md").exists()
+        assert (tmp_path / "feature_dictionary.csv").exists()
+        assert (tmp_path / "tables").is_dir()
+        assert (tmp_path / "tasks" / "converted_within_90_days").is_dir()
+
+    def test_manifest_is_valid_json(self, sim_outputs, tmp_path):
+        config, population, result, world_graph = sim_outputs
+        from leadforge.api.bundle import write_bundle
+        from leadforge.core.models import WorldBundle, WorldSpec
+
+        bundle = WorldBundle(
+            spec=WorldSpec(config=config),
+            population=population,
+            simulation_result=result,
+            world_graph=world_graph,
+        )
+        write_bundle(bundle, str(tmp_path))
+
+        data = json.loads((tmp_path / "manifest.json").read_text())  # must parse as JSON
+        assert data["seed"] == config.seed
+
+    def test_unpopulated_bundle_raises(self, tmp_path):
+        from leadforge.api.bundle import write_bundle
+        from leadforge.core.models import WorldBundle
+
+        with pytest.raises(RuntimeError, match="not fully populated"):
+            write_bundle(WorldBundle(), str(tmp_path))  # bare bundle; presumably all parts unset
+
+    def test_generator_generate_and_save(self, tmp_path):
+        """End-to-end: Generator.from_recipe -> generate -> save, then read manifest.json back."""
+        from leadforge.api.generator import Generator
+
+        gen = Generator.from_recipe("b2b_saas_procurement_v1", seed=7)
+        bundle = gen.generate(n_leads=60, n_accounts=20, n_contacts=60)
+        bundle.save(str(tmp_path))
+
+        assert (tmp_path / "manifest.json").exists()
+        manifest = json.loads((tmp_path / "manifest.json").read_text())
+        assert manifest["n_leads"] == 60  # generate() kwargs must be reflected in the manifest
+        assert manifest["seed"] == 7