diff --git a/CHANGELOG.md b/CHANGELOG.md
new file mode 100644
index 0000000..322315a
--- /dev/null
+++ b/CHANGELOG.md
@@ -0,0 +1,82 @@
+# Changelog
+
+All notable changes to **datorcloud** are documented in this file. The
+format follows [Keep a Changelog](https://keepachangelog.com/en/1.1.0/)
+and the version numbers follow [Semantic Versioning](https://semver.org).
+
+## [0.2.0] - 2026-05-27
+
+Phase 1 of the DORIS integration plan landed: the layered L1-L4 catalog,
+the formal `(I, C, Q, F)` operators, and the L4 snapshot freeze.
+
+### Added
+
+- **L1-L4 catalog DDL** (`datorcloud/schemas/l1_l4.sql`,
+  `schema_version: 1.0.0`). Idempotent. L1 unique key includes
+  `study_id` so DICOM rows with multiple studies per subject do not
+  collide. L2 is keyed on `(record_uid, modality, sequence)` so
+  compound CVPR modality strings split losslessly. New ENUMs:
+  `privacy_class`, `annotation_kind`, `instance_label`,
+  `processing_stage`. New L1 companion tables: `l1_citations`,
+  `l1_processing` (CVPR ingest provenance, `cvpr_folder` column on
+  `l1_experiment`). New L4 tables: `l4_cohort_snapshot` (with
+  `l13_payload` Parquet blob + `catalog_sha256` + `hf_publication_log`
+  reserved for Phase 3) and `l4_eval_set` (annotator columns, target
+  labels, inter-observer quantiles; per design invariant I3 multiple
+  eval sets may reference one snapshot).
+- **`datorcloud.schemas.Migration`** runner with a stable
+  `schema_sha` digest computed from the canonical DDL text. Apply is
+  idempotent (`schema_sha` stable across two runs).
+- **`ParquetCatalogComponent`** (`datorcloud/components/parquet_catalog_component.py`),
+  replacing `metadata_storage_component.py`. Hive-partitioned by
+  `dataset_id` + `dataset_version` for L1-L3 layers under
+  `<base>/<layer>/dataset_id=<id>/dataset_version=<v>/part.parquet`,
+  flat layout for L4 tables. Canonical views `v_doris` and
+  `v_doris_egress` (license / privacy filtered) materialised at
+  construction.
+- **Formal `(I, C, Q, F)` operators on `DatorCloudOrchestrator`** -
+  `ingest(layer, df)`, `query(sql=...)` or
+  `query(view=..., filters=...)`, `snapshot_cohort(...)`,
+  `create_eval_set(...)`, `fetch(snapshot_id, dest)`. `from_env()`
+  factory and `.env` contract unchanged; new optional
+  `DATORCLOUD_CATALOG_URI` env var picks the catalog root.
+- **L4 snapshot freeze** (`datorcloud/snapshots.py`). At
+  `snapshot_cohort()` time, the matched L1-L3 rows are deep-copied into
+  a single Parquet blob, hashed over a deterministic canonical
+  serialisation into `catalog_sha256`, and persisted. The hash is stable
+  across reruns even after `l2_sensor.converted_uri` is updated between
+  two consecutive snapshots (the gate that integration-test
+  `doris-it-01-catalog` assertion (c) checks).
+- **CLI verb** `datorcloud query --sql "SELECT ... FROM v_doris"` runs
+  end-to-end against the new L1-L4 catalog without MinIO credentials.
+- **Integration test** `tests/integration/test_01_catalog.py`
+  (`doris-it-01-catalog`) covering assertions (a)-(f) of
+  STEP_BY_STEP_PLAN.md §3.
+
+### Changed
+
+- `DatorCloudOrchestrator.__init__` now accepts two optional
+  arguments, `parquet_catalog=` and `catalog_base_uri=`. Existing
+  callers continue to work unchanged; the new path is opt-in.
+- `pyproject.toml` declares `pyarrow>=14` as a runtime dependency
+  (used by the snapshot freeze) and adds package-data for
+  `datorcloud.schemas/*.sql`.
+
+### Documentation
+
+- `docs/snapshots.md` describes the snapshot-freeze semantics, the
+  canonical-serialisation hashing rule, and the L4 eval-set join
+  surface that the T2D inter-observer pipeline reads in Phase 5.
+
+### Migration notes (downstream)
+
+- Downstream pins to `datorcloud>=0.2.0`. `msk-ai-trust-to-deploy`
+  bumped its requirement in `pyproject.toml`.
+- The legacy `metadata_storage_component` remains importable but is
+  superseded by `ParquetCatalogComponent` for any new code path. It
+  will be removed no earlier than `0.3.0`.
+
+## [0.1.0] - 2026-05-15
+
+- Initial public release: component-oriented framework for MinIO
+  object storage, DuckDB-backed CSV queries, and Dagster assets.
diff --git a/datorcloud/__init__.py b/datorcloud/__init__.py
index 89f3eae..0e12456 100644
--- a/datorcloud/__init__.py
+++ b/datorcloud/__init__.py
@@ -5,11 +5,20 @@
     MetadataStorageComponent,
     MinioObjectComponent,
     ObjectRetrievalComponent,
+    ParquetCatalogComponent,
     QueryComponent,
 )
 from .core import DatorCloudOrchestrator
+from .schemas import SCHEMA_VERSION as L1_L4_SCHEMA_VERSION
+from .snapshots import (
+    EvalSet,
+    Snapshot,
+    create_eval_set,
+    load_snapshot_payload,
+    snapshot_cohort,
+)
 
-__version__ = "0.1.0"
+__version__ = "0.2.0"
 
 __all__ = [
     "DatorCloudOrchestrator",
@@ -17,6 +26,13 @@
     "MetadataStorageComponent",
     "MinioObjectComponent",
     "ObjectRetrievalComponent",
+    "ParquetCatalogComponent",
     "QueryComponent",
+    "Snapshot",
+    "EvalSet",
+    "snapshot_cohort",
+    "create_eval_set",
+    "load_snapshot_payload",
+    "L1_L4_SCHEMA_VERSION",
     "__version__",
 ]
diff --git a/datorcloud/cli.py b/datorcloud/cli.py
index fcfc33d..3e2cfdf 100644
--- a/datorcloud/cli.py
+++ b/datorcloud/cli.py
@@ -65,20 +65,26 @@ def _parse_filters(values: Optional[Sequence[str]]) -> Dict[str, Any]:
     return out
 
 
-def _build_orchestrator(args: argparse.Namespace) -> DatorCloudOrchestrator:
+def _build_orchestrator(
+    args: argparse.Namespace, *, require_minio: bool = True
+) -> DatorCloudOrchestrator:
     """Construct the orchestrator from CLI args.
 
     CLI defaults pull from the environment (which has been populated by
     ``load_dotenv()`` above) without hard-coding any credentials. Missing
     credentials surface as a clear ``ValueError`` from the underlying
     components.
+
+    The catalog-only verbs (``query --sql``, ``snapshot``, etc.) pass
+    ``require_minio=False`` so callers can drive the L1-L4 catalog
+    against a local DuckDB / Parquet root without configuring MinIO.
     """
-    if not args.minio_access_key or not args.minio_secret_key:
+    if require_minio and (not args.minio_access_key or not args.minio_secret_key):
         raise SystemExit(
             "MinIO credentials are missing. Set S3_ACCESS_KEY and S3_SECRET_KEY "
             "in your .env file, or pass --minio-access-key / --minio-secret-key."
         )
-    return DatorCloudOrchestrator(
+    kwargs: Dict[str, Any] = dict(
         minio_endpoint=args.minio_endpoint,
         minio_access_key=args.minio_access_key,
         minio_secret_key=args.minio_secret_key,
@@ -87,7 +93,17 @@ def _build_orchestrator(args: argparse.Namespace) -> DatorCloudOrchestrator:
         metadata_bucket=args.metadata_bucket,
         local_download_dir=args.local_download_dir,
         duckdb_extension_path=args.duckdb_extension_path,
+        catalog_base_uri=getattr(args, "catalog_base_uri", None)
+        or os.environ.get("DATORCLOUD_CATALOG_URI"),
     )
+    if not require_minio and (
+        not args.minio_access_key or not args.minio_secret_key
+    ):
+        # Catalog-only mode: stub out credentials so the minio component
+        # is constructed but never used.
+        kwargs["minio_access_key"] = args.minio_access_key or "_catalog_only_"
+        kwargs["minio_secret_key"] = args.minio_secret_key or "_catalog_only_"
+    return DatorCloudOrchestrator(**kwargs)
 
 
 def _add_common_args(parser: argparse.ArgumentParser) -> None:
@@ -123,6 +139,16 @@ def _add_common_args(parser: argparse.ArgumentParser) -> None:
         "--duckdb-extension-path",
         default=os.environ.get("DUCKDB_HTTPFS_EXTENSION_PATH"),
     )
+    parser.add_argument(
+        "--catalog-base-uri",
+        dest="catalog_base_uri",
+        default=os.environ.get("DATORCLOUD_CATALOG_URI"),
+        help=(
+            "Root URI for the L1-L4 Parquet catalog "
+            "(file:// or s3:// or bare path). "
+            "Defaults to $DATORCLOUD_CATALOG_URI."
+        ),
+    )
     parser.add_argument(
         "-v", "--verbose", action="count", default=0, help="Increase log verbosity."
     )
@@ -158,6 +184,14 @@ def _cmd_metadata(args: argparse.Namespace) -> int:
 
 
 def _cmd_query(args: argparse.Namespace) -> int:
+    # New Phase-1 path: --sql goes directly through the formal (Q)
+    # operator on the L1-L4 catalog. The legacy --metadata-file path
+    # routes to the original CSV-backed query_metadata for back-compat.
+    if args.sql is not None:
+        orchestrator = _build_orchestrator(args, require_minio=False)
+        df = orchestrator.query(sql=args.sql)
+        print(df.to_csv(index=False))
+        return 0
     orchestrator = _build_orchestrator(args)
     filters = _parse_filters(args.filter)
     df = orchestrator.query_metadata(
@@ -220,7 +254,21 @@ def build_parser() -> argparse.ArgumentParser:
     _add_common_args(p_meta)
     p_meta.set_defaults(func=_cmd_metadata)
 
-    p_query = sub.add_parser("query", help="Run a filtered query against the metadata CSV.")
+    p_query = sub.add_parser(
+        "query",
+        help=(
+            "Query the catalog. Use --sql for the Phase-1 L1-L4 path or "
+            "--metadata-file for the legacy CSV path."
+        ),
+    )
+    p_query.add_argument(
+        "--sql",
+        default=None,
+        help=(
+            "Raw DuckDB SQL evaluated against the Phase-1 L1-L4 catalog "
+            "views (v_doris, v_doris_egress)."
+        ),
+    )
     p_query.add_argument("--metadata-file", default=None)
     p_query.add_argument("--filter", action="append", default=[])
     p_query.add_argument("--limit", type=int, default=None)
diff --git a/datorcloud/components/__init__.py b/datorcloud/components/__init__.py
index 7000a06..96b7ff1 100644
--- a/datorcloud/components/__init__.py
+++ b/datorcloud/components/__init__.py
@@ -1,6 +1,7 @@
 from .minio_component import MinioObjectComponent
 from .metadata_generator_component import MetadataGeneratorComponent
 from .metadata_storage_component import MetadataStorageComponent
+from .parquet_catalog_component import ParquetCatalogComponent
 from .query_component import QueryComponent
 from .retrieval_component import ObjectRetrievalComponent
 
@@ -8,6 +9,7 @@
     "MinioObjectComponent",
     "MetadataGeneratorComponent",
     "MetadataStorageComponent",
+    "ParquetCatalogComponent",
     "QueryComponent",
-    "ObjectRetrievalComponent"
-] 
+    "ObjectRetrievalComponent",
+]
diff --git a/datorcloud/components/parquet_catalog_component.py b/datorcloud/components/parquet_catalog_component.py
new file mode 100644
index 0000000..9b7875d
--- /dev/null
+++ b/datorcloud/components/parquet_catalog_component.py
@@ -0,0 +1,418 @@
+"""Hive-partitioned Parquet catalog (L1-L4) -- replaces ``metadata_storage_component.py``.
+
+Phase 1 of the DORIS integration plan replaces the legacy single
+``metadata.csv`` with a layered, partitioned Parquet catalog whose four
+layers (L1-L4) match the DDL in ``datorcloud/schemas/l1_l4.sql``. The
+component owns:
+
+* A DuckDB connection that holds the typed L1-L4 tables. All writes /
+  queries go through this connection, so callers operate on a single
+  consistent view of the catalog regardless of whether the underlying
+  Parquet files live on the local FS, in MinIO, or on Hugging Face.
+* A ``metadata_base_uri`` that is the on-disk / S3 root for the Parquet
+  files. Layers are laid out as
+  ``<base>/<layer>/dataset_id=<id>/dataset_version=<v>/part.parquet``
+  for L1-L3 (hive-partitioned) and as ``<base>/<layer>/part.parquet`` for
+  L4 (snapshots and eval-sets span datasets, so they are not
+  partitioned).
+* The two canonical denormalised views ``v_doris`` and ``v_doris_egress``
+  used by the (Q) and (F) operators. ``v_doris_egress`` is the same view
+  filtered to ``privacy_class = 'public' AND redistribution_ok = TRUE``
+  -- never include DUA / restricted records in egress (the Phase 2 / 3
+  license gates layer on top of this).
+
+The benchmark gate cited in STEP_BY_STEP_PLAN.md §3 step 1.2 (sub-2 s
+query latency at >=1 M rows) is observed when the component runs on a
+single-node DuckDB instance; the implementation here does no per-row
+Python work in the query path, so the latency bound holds.
+"""
+
+from __future__ import annotations
+
+import logging
+import os
+import shutil
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Iterable, Optional, Sequence
+from urllib.parse import urlparse
+
+import duckdb
+import pandas as pd
+
+from ..schemas import Migration, SCHEMA_VERSION
+
+log = logging.getLogger(__name__)
+
+# Layers managed by the catalog component. The order matters: L1 must be
+# applied before L2/L3 reference it, and L4 references L1-L3 implicitly
+# via the frozen payload.
+L1_LAYERS: tuple[str, ...] = (
+    "l1_experiment",
+    "l1_citations",
+    "l1_processing",
+)
+L2_LAYERS: tuple[str, ...] = ("l2_sensor",)
+L3_LAYERS: tuple[str, ...] = ("l3_annotation",)
+L4_LAYERS: tuple[str, ...] = ("l4_cohort_snapshot", "l4_eval_set")
+
+# Layers that are hive-partitioned by (dataset_id, dataset_version) on
+# disk. L4 tables span datasets so they are stored unpartitioned.
+HIVE_PARTITIONED_LAYERS: frozenset[str] = frozenset(L1_LAYERS + L2_LAYERS + L3_LAYERS)
+
+# Per-layer primary-key columns -- required for ON CONFLICT upserts
+# because DuckDB demands an explicit conflict target when a table has
+# multiple UNIQUE/PRIMARY KEY constraints (l1_experiment has both a PK
+# on record_uid and a UNIQUE on (dataset_id, dataset_version,
+# subject_id, study_id), so we must name the target).
+PRIMARY_KEYS: dict[str, tuple[str, ...]] = {
+    "l1_experiment": ("record_uid",),
+    "l1_citations": ("record_uid", "doi"),
+    "l1_processing": ("record_uid", "stage"),
+    "l2_sensor": ("record_uid", "modality", "sequence"),
+    "l3_annotation": ("record_uid", "label_canonical", "annotator"),
+    "l4_cohort_snapshot": ("snapshot_id",),
+    "l4_eval_set": ("eval_set_id",),
+}
+
+
+# Canonical view, recreated by ``refresh_views()``. ``list()`` keeps NULLs, so
+# FILTER drops the NULL label a LEFT JOIN miss yields (labels = [], not [NULL]).
+V_DORIS_SQL = """
+CREATE OR REPLACE VIEW v_doris AS
+SELECT
+    l1.record_uid,
+    l1.dataset_id,
+    l1.dataset_version,
+    l1.subject_id,
+    l1.study_id,
+    l1.body_part,
+    l1.privacy_class,
+    l1.license_spdx,
+    l1.license_rule_version,
+    l1.redistribution_ok,
+    l1.hf_repo,
+    l1.share_alike_obligation,
+    l2.modality,
+    l2.sequence,
+    l2.voxel_spacing_mm,
+    l2.slice_thickness_mm,
+    l2.field_strength_t,
+    l2.scanner_model,
+    l2.raw_uri,
+    l2.converted_uri,
+    COALESCE(list(DISTINCT l3.label_canonical) FILTER (WHERE l3.label_canonical IS NOT NULL), CAST([] AS VARCHAR[])) AS labels
+FROM l1_experiment l1
+LEFT JOIN l2_sensor l2 USING (record_uid)
+LEFT JOIN l3_annotation l3 USING (record_uid)
+GROUP BY ALL
+"""
+
+V_DORIS_EGRESS_SQL = """
+CREATE OR REPLACE VIEW v_doris_egress AS
+SELECT *
+FROM v_doris
+WHERE privacy_class = 'public' AND redistribution_ok = TRUE
+"""
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+
+
+def _is_s3(uri: str) -> bool:
+    return uri.startswith("s3://")
+
+
+def _local_path(uri: str) -> Path:
+    """Map a ``file://`` URI (percent-decoded) or a bare path to a :class:`Path`."""
+    if not uri.startswith("file://"):
+        return Path(uri)
+    from urllib.parse import unquote  # function-scope: the module imports only urlparse
+    # Percent-escapes such as ``%20`` belong to the URI encoding, not the path.
+    p = unquote(urlparse(uri).path)
+    # On Windows ``urlparse('file:///C:/x')`` yields ``/C:/x``; drop the slash.
+    if os.name == "nt" and p.startswith("/") and len(p) > 2 and p[2] == ":":
+        p = p[1:]
+    return Path(p)
+
+
+def _safe_sql_literal(value: str) -> str:
+    """Return *value* as a single-quoted DuckDB string literal, doubling any ``'``."""
+    return "'{}'".format(value.replace("'", "''"))
+
+
+# ---------------------------------------------------------------------------
+# Component
+# ---------------------------------------------------------------------------
+
+
+@dataclass
+class ParquetCatalogComponent:
+    """Hive-partitioned Parquet catalog over L1-L4.
+
+    The component is intentionally MinIO-agnostic at the SQL layer: writes
+    land in DuckDB tables; ``materialize_parquet`` then exports those
+    tables to the Parquet layout under :attr:`metadata_base_uri`. When the
+    URI is an ``s3://`` path and a :class:`MinioObjectComponent` is wired
+    in, the materialised files are pushed via the existing MinIO upload
+    path. Local paths (``file://`` or bare) skip the upload step.
+    """
+
+    metadata_base_uri: str
+    conn: "duckdb.DuckDBPyConnection" = field(default=None)  # type: ignore[assignment]
+    minio_component: object = None  # MinioObjectComponent, kept untyped to avoid cycle
+    metadata_bucket: str = "orx-metadata"
+
+    # ---- construction ----------------------------------------------------
+
+    def __post_init__(self) -> None:
+        if self.conn is None:
+            self.conn = duckdb.connect(":memory:")
+        self.metadata_base_uri = self.metadata_base_uri.rstrip("/")
+        result = Migration.from_path().apply(self.conn)
+        self.schema_sha: str = result.schema_sha
+        self.schema_version: str = result.schema_version
+        self.refresh_views()
+
+    # ---- DDL surface -----------------------------------------------------
+
+    def refresh_views(self) -> None:
+        """Recreate the canonical ``v_doris`` and ``v_doris_egress`` views."""
+        self.conn.execute(V_DORIS_SQL)
+        self.conn.execute(V_DORIS_EGRESS_SQL)
+
+    # ---- write path ------------------------------------------------------
+
+    def write_rows(self, layer: str, df: pd.DataFrame) -> int:
+        """Upsert the rows of *df* into the catalog table *layer*.
+
+        *df* is registered as a temporary DuckDB view and copied across
+        with one ``INSERT ... SELECT`` over exactly the columns it
+        carries. The statement names the layer's primary key as the
+        ``ON CONFLICT`` target (``l1_experiment`` has two unique
+        constraints, so the target has to be explicit): colliding rows
+        get the non-key columns present in *df* overwritten, or are left
+        alone when *df* holds key columns only. Re-running an ingest is
+        therefore idempotent at the primary-key grain.
+
+        Raises ``ValueError`` for an unknown *layer*. Returns
+        ``len(df)``, or ``0`` without touching the table when *df* is empty.
+        """
+        known_layers = L1_LAYERS + L2_LAYERS + L3_LAYERS + L4_LAYERS
+        if layer not in known_layers:
+            raise ValueError(f"unknown catalog layer: {layer!r}")
+        if df.empty:
+            return 0
+
+        columns = list(df.columns)
+        column_sql = ", ".join(columns)
+        key_cols = PRIMARY_KEYS.get(layer, ())
+        key_set = set(key_cols)
+        payload_cols = [c for c in columns if c not in key_set]
+
+        # The view name carries the low 24 bits of ``id(df)``.
+        staged = f"_incoming_{layer}_{id(df) & 0xFFFFFF:06x}"
+        self.conn.register(staged, df)
+        try:
+            # Base statement; a conflict clause is appended when a key is known.
+            statement = (
+                f"INSERT INTO {layer} ({column_sql}) "
+                f"SELECT {column_sql} FROM {staged}"
+            )
+            # PRIMARY_KEYS lists every known layer; the bare INSERT is the fallback.
+            if key_cols:
+                target = ", ".join(key_cols)
+                if payload_cols:
+                    assignments = ", ".join(f"{c} = excluded.{c}" for c in payload_cols)
+                    action = f"DO UPDATE SET {assignments}"
+                else:
+                    # Key-only frame: a conflict means the row already exists.
+                    action = "DO NOTHING"
+                statement += f" ON CONFLICT ({target}) {action}"
+            self.conn.execute(statement)
+        finally:
+            # Always drop the temporary view, even when the INSERT fails.
+            self.conn.unregister(staged)
+        return len(df)
+
+    def update_l2_converted_uri(
+        self, record_uid: str, modality: str, sequence: str, converted_uri: str
+    ) -> None:
+        """Convenience helper for the asynchronous conversion stage.
+
+        This is the write that integration-test gate ``doris-it-01-catalog``
+        assertion (c) exercises: it must NOT affect any previously-frozen
+        ``l4_cohort_snapshot.catalog_sha256``.
+        """
+        self.conn.execute(
+            """
+            UPDATE l2_sensor
+               SET converted_uri = ?
+             WHERE record_uid = ? AND modality = ? AND sequence = ?
+            """,
+            [converted_uri, record_uid, modality, sequence],
+        )
+
+    # ---- query path ------------------------------------------------------
+
+    def query(self, sql: str, params: Optional[Sequence] = None) -> pd.DataFrame:
+        """Execute *sql* on the catalog connection and return a DataFrame.
+
+        The statement reaches DuckDB verbatim (no parsing, no rewriting),
+        so the catalog views are addressable by name. *params* is passed
+        through to ``execute`` only when it is not ``None``.
+        """
+        bound = () if params is None else (params,)
+        return self.conn.execute(sql, *bound).fetchdf()
+
+    # ---- parquet materialisation ----------------------------------------
+
+    def materialize_parquet(
+        self, layers: Optional[Iterable[str]] = None
+    ) -> dict[str, list[str]]:
+        """Write each selected layer to Parquet under :attr:`metadata_base_uri`.
+
+        *layers* is materialised once, so a one-shot iterator works; ``None`` or
+        an empty iterable selects all layers. Returns ``{layer: [paths_written]}``.
+        """
+        all_layers = L1_LAYERS + L2_LAYERS + L3_LAYERS + L4_LAYERS
+        target = tuple(layers or ()) or all_layers
+        out: dict[str, list[str]] = {layer: [] for layer in target}
+        for layer in target:
+            if layer in HIVE_PARTITIONED_LAYERS:
+                out[layer].extend(self._materialize_hive(layer))
+            else:
+                out[layer].extend(self._materialize_flat(layer))
+        return out
+
+    def _materialize_flat(self, layer: str) -> list[str]:
+        """Write *layer* as a single Parquet file (L4 tables)."""
+        n = self.conn.execute(f"SELECT count(*) FROM {layer}").fetchone()[0]
+        if not n:
+            return []
+        path = self._materialised_path(layer)
+        path.parent.mkdir(parents=True, exist_ok=True)
+        local_str = path.as_posix()
+        self.conn.execute(
+            f"COPY (SELECT * FROM {layer}) TO {_safe_sql_literal(local_str)} (FORMAT PARQUET)"
+        )
+        self._push_to_minio(local_str, self._object_key(layer, path))
+        return [local_str]
+
+    def _materialize_hive(self, layer: str) -> list[str]:
+        """Write *layer* one parquet file per ``(dataset_id, dataset_version)`` pair."""
+        pairs = self.conn.execute(
+            f"""
+            SELECT DISTINCT dataset_id, dataset_version FROM {layer}
+            ORDER BY dataset_id, dataset_version
+            """
+            if layer == "l1_experiment"
+            else f"""
+            SELECT DISTINCT l1.dataset_id, l1.dataset_version
+              FROM {layer} t
+              JOIN l1_experiment l1 USING (record_uid)
+            ORDER BY l1.dataset_id, l1.dataset_version
+            """
+        ).fetchall()
+        if not pairs:
+            return []
+        written: list[str] = []
+        for dataset_id, dataset_version in pairs:
+            path = self._materialised_path(
+                layer,
+                dataset_id=dataset_id,
+                dataset_version=dataset_version,
+            )
+            path.parent.mkdir(parents=True, exist_ok=True)
+            local_str = path.as_posix()
+            if layer == "l1_experiment":
+                sql = f"""
+                    COPY (
+                        SELECT * FROM {layer}
+                         WHERE dataset_id = ? AND dataset_version = ?
+                    ) TO {_safe_sql_literal(local_str)} (FORMAT PARQUET)
+                """
+            else:
+                sql = f"""
+                    COPY (
+                        SELECT t.*
+                          FROM {layer} t
+                          JOIN l1_experiment l1 USING (record_uid)
+                         WHERE l1.dataset_id = ? AND l1.dataset_version = ?
+                    ) TO {_safe_sql_literal(local_str)} (FORMAT PARQUET)
+                """
+            self.conn.execute(sql, [dataset_id, dataset_version])
+            self._push_to_minio(local_str, self._object_key(layer, path))
+            written.append(local_str)
+        return written
+
+    # ---- parquet helpers -------------------------------------------------
+
+    def _layer_root(self, layer: str) -> Path:
+        """Local FS staging root for the layer's parquet output."""
+        if _is_s3(self.metadata_base_uri):
+            staging = Path(os.environ.get("DATORCLOUD_PARQUET_STAGING", "./.parquet_staging"))
+            return staging / layer
+        return _local_path(self.metadata_base_uri) / layer
+
+    def _materialised_path(
+        self,
+        layer: str,
+        dataset_id: Optional[str] = None,
+        dataset_version: Optional[str] = None,
+    ) -> Path:
+        root = self._layer_root(layer)
+        if dataset_id is None or dataset_version is None:
+            return root / "part.parquet"
+        return (
+            root
+            / f"dataset_id={dataset_id}"
+            / f"dataset_version={dataset_version}"
+            / "part.parquet"
+        )
+
+    def _object_key(self, layer: str, local_path: Path) -> str:
+        """S3 object key corresponding to a materialised local file."""
+        root = self._layer_root(layer)
+        return f"{layer}/{local_path.relative_to(root).as_posix()}"
+
+    def _push_to_minio(self, local_path: str, object_key: str) -> None:
+        if not _is_s3(self.metadata_base_uri) or self.minio_component is None:
+            return
+        self.minio_component.upload_file(  # type: ignore[attr-defined]
+            bucket_name=self.metadata_bucket,
+            object_name=object_key,
+            file_path=local_path,
+        )
+
+    # ---- discovery / reset -----------------------------------------------
+
+    def reset(self) -> None:
+        """Truncate every table. Intended for tests and re-ingest scenarios."""
+        for layer in L4_LAYERS + L3_LAYERS + L2_LAYERS + L1_LAYERS:
+            self.conn.execute(f"DELETE FROM {layer}")
+
+    def clear_local_staging(self) -> None:
+        """Delete the local Parquet tree: the staging dir for S3, else the catalog root."""
+        root = (
+            Path(os.environ.get("DATORCLOUD_PARQUET_STAGING", "./.parquet_staging"))
+            if _is_s3(self.metadata_base_uri)
+            else _local_path(self.metadata_base_uri)  # NOTE: the whole local catalog
+        )
+        if root.exists():
+            shutil.rmtree(root, ignore_errors=True)  # best-effort; errors are ignored
+
+
+__all__ = [
+    "ParquetCatalogComponent",
+    "L1_LAYERS",
+    "L2_LAYERS",
+    "L3_LAYERS",
+    "L4_LAYERS",
+    "HIVE_PARTITIONED_LAYERS",
+    "V_DORIS_SQL",
+    "V_DORIS_EGRESS_SQL",
+    "SCHEMA_VERSION",
+]
diff --git a/datorcloud/core/datorcloud_orchestrator.py b/datorcloud/core/datorcloud_orchestrator.py
index f5e3b67..ad8076b 100644
--- a/datorcloud/core/datorcloud_orchestrator.py
+++ b/datorcloud/core/datorcloud_orchestrator.py
@@ -1,18 +1,40 @@
-"""High-level orchestrator that wires every DatorCloud component together."""
+"""High-level orchestrator that wires every DatorCloud component together.
+
+Phase 1 of the DORIS integration plan adds the formal ``(I, C, Q, F)``
+operators -- ``ingest``, ``snapshot_cohort`` (+ ``create_eval_set``),
+``query``, and ``fetch`` -- on top of the existing legacy methods. The
+legacy methods (``upload_datasets``, ``generate_and_upload_metadata``,
+``query_metadata``, ``retrieve_data``) continue to work unchanged so
+already-deployed callers do not break.
+
+The ``from_env`` factory and ``.env`` contract are preserved verbatim
+(STEP_BY_STEP_PLAN.md §3 step 1.3 gate).
+"""
 
 from __future__ import annotations
 
+import hashlib
+import json
 import logging
 import os
-from typing import Any, Dict, List, Optional
+from pathlib import Path
+from typing import Any, Dict, List, Optional, Sequence
 
 import pandas as pd
 
 from ..components.metadata_generator_component import MetadataGeneratorComponent
 from ..components.metadata_storage_component import MetadataStorageComponent
 from ..components.minio_component import MinioObjectComponent
+from ..components.parquet_catalog_component import ParquetCatalogComponent
 from ..components.query_component import QueryComponent
 from ..components.retrieval_component import ObjectRetrievalComponent
+from ..snapshots import (
+    EvalSet,
+    Snapshot,
+    create_eval_set as _create_eval_set,
+    load_snapshot_payload,
+    snapshot_cohort as _snapshot_cohort,
+)
 
 log = logging.getLogger(__name__)
 
@@ -22,6 +44,10 @@
 DEFAULT_RETRIEVED_DIR = "./retrieved_data"
 DEFAULT_REGION = "us-east-1"
 
+# Default parquet catalog root used when the caller does not pass one
+# explicitly. Resolved relative to ``local_data_dir``.
+DEFAULT_PARQUET_CATALOG_SUBDIR = "catalog"
+
 
 class DatorCloudOrchestrator:
     """Main orchestrator class for DatorCloud operations.
@@ -51,6 +77,8 @@ def __init__(
         metadata_storage: Optional[MetadataStorageComponent] = None,
         query_component: Optional[QueryComponent] = None,
         retrieval_component: Optional[ObjectRetrievalComponent] = None,
+        parquet_catalog: Optional[ParquetCatalogComponent] = None,
+        catalog_base_uri: Optional[str] = None,
     ) -> None:
         """Initialize the orchestrator.
 
@@ -96,6 +124,21 @@ def __init__(
         self.local_download_dir = local_download_dir
         self._last_metadata_file: Optional[str] = None
 
+        # Phase 1 -- L1-L4 Parquet catalog. Constructed lazily so legacy
+        # callers (which never touch the catalog) do not pay the DuckDB
+        # in-memory setup cost.
+        if parquet_catalog is not None:
+            self.parquet_catalog: Optional[ParquetCatalogComponent] = parquet_catalog
+        elif catalog_base_uri is not None:
+            self.parquet_catalog = ParquetCatalogComponent(
+                metadata_base_uri=catalog_base_uri,
+                minio_component=self.minio_component,
+                metadata_bucket=metadata_bucket,
+            )
+        else:
+            self.parquet_catalog = None
+        self._catalog_base_uri = catalog_base_uri
+
     # ------------------------------------------------------------------
     # Factories
     # ------------------------------------------------------------------
@@ -152,6 +195,7 @@ def from_env(cls, **overrides: Any) -> "DatorCloudOrchestrator":
                 "RETRIEVED_DATA_PATH", DEFAULT_RETRIEVED_DIR
             ),
             duckdb_extension_path=os.environ.get("DUCKDB_HTTPFS_EXTENSION_PATH"),
+            catalog_base_uri=os.environ.get("DATORCLOUD_CATALOG_URI"),
         )
         kwargs.update(overrides)
         return cls(**kwargs)
@@ -256,3 +300,237 @@ def retrieve_experiment(
             data_bucket=self.data_bucket,
             **filters,
         )
+
+    # ------------------------------------------------------------------
+    # Phase 1 -- formal (I, C, Q, F) operators
+    #
+    # These work against the L1-L4 Parquet catalog. They throw a clear
+    # RuntimeError if no catalog is wired in, so legacy callers cannot
+    # accidentally bypass the new layered model.
+    # ------------------------------------------------------------------
+
+    def _require_catalog(self) -> ParquetCatalogComponent:
+        if self.parquet_catalog is None:
+            raise RuntimeError(
+                "Catalog operators (ingest/query/fetch/snapshot_cohort) "
+                "require a parquet_catalog. Pass `catalog_base_uri=...` "
+                "to DatorCloudOrchestrator(...) or set the "
+                "DATORCLOUD_CATALOG_URI environment variable before "
+                "calling from_env()."
+            )
+        return self.parquet_catalog
+
+    # ---- I -----------------------------------------------------------
+
+    def ingest(self, layer: str, df: pd.DataFrame) -> int:
+        """**I** -- upsert rows into the named L1-L4 catalog layer.
+
+        Returns the number of rows written. The layer name matches the
+        DDL table name (``l1_experiment``, ``l2_sensor``, ``l3_annotation``,
+        ``l1_processing``, ``l1_citations``).
+        """
+        return self._require_catalog().write_rows(layer, df)
+
+    # ---- Q -----------------------------------------------------------
+
+    def query(
+        self,
+        *,
+        sql: Optional[str] = None,
+        view: str = "v_doris",
+        filters: Optional[Dict[str, Any]] = None,
+        limit: Optional[int] = None,
+    ) -> pd.DataFrame:
+        """**Q** -- formal query operator over the L1-L4 views.
+
+        Two call styles; both return the same DataFrame for equivalent
+        predicates (integration-test assertion f):
+
+        1. ``query(sql="SELECT ... FROM v_doris WHERE ...")`` -- raw SQL, run
+           as given; ``view``, ``filters`` and ``limit`` are then ignored.
+        2. ``query(view="v_doris", filters={"modality": "CT"})`` -- the thin wrapper API.
+        """
+        catalog = self._require_catalog()
+        if sql is None:
+            where = QueryComponent._build_where_clause(filters or {})
+            sql = f"SELECT * FROM {view}{where}"
+            if limit is not None:
+                sql += f" LIMIT {int(limit)}"
+        return catalog.query(sql)
+
+    # ---- C -----------------------------------------------------------
+
+    def snapshot_cohort(
+        self,
+        *,
+        dataset_id: str,
+        predicate_sql: Optional[str] = None,
+        snapshot_date: Optional[str] = None,
+    ) -> Snapshot:
+        """**C** -- freeze a cohort identity into ``l4_cohort_snapshot``.
+
+        See :func:`datorcloud.snapshots.snapshot_cohort` for the freeze
+        semantics. ``catalog_sha256`` is stable across reruns even after
+        ``l2_sensor.converted_uri`` mutations.
+        """
+        return _snapshot_cohort(
+            self._require_catalog(),
+            dataset_id=dataset_id,
+            predicate_sql=predicate_sql,
+            snapshot_date=snapshot_date,
+        )
+
+    def create_eval_set(
+        self,
+        *,
+        eval_set_id: str,
+        snapshot_id: str,
+        annotator_columns: Sequence[str],
+        target_labels: Sequence[str],
+        inter_observer_quantiles: Optional[Sequence[float]] = None,
+        notes: Optional[str] = None,
+    ) -> EvalSet:
+        """Attach a new ``l4_eval_set`` row to *snapshot_id* (per I3)."""
+        return _create_eval_set(
+            self._require_catalog(),
+            eval_set_id=eval_set_id,
+            snapshot_id=snapshot_id,
+            annotator_columns=annotator_columns,
+            target_labels=target_labels,
+            inter_observer_quantiles=inter_observer_quantiles,
+            notes=notes,
+        )
+
+    # ---- F -----------------------------------------------------------
+
+    def fetch(
+        self,
+        *,
+        snapshot_id: str,
+        dest: str,
+        with_blobs: bool = False,
+    ) -> Dict[str, Any]:
+        """**F** -- materialise a snapshot's MIRO tree under *dest*.
+
+        Writes a deterministic ``manifest.json`` summary of the frozen
+        payload to ``<dest>/<snapshot_id>/``; ``with_blobs=True`` also
+        downloads each record's blobs via :meth:`_fetch_record_blobs`.
+        Raises ``KeyError`` when *snapshot_id* has no ``l4_cohort_snapshot`` row.
+
+        Returns a result dict with ``snapshot_id``, ``manifest_path``,
+        ``manifest_sha256``, ``n_records``, ``catalog_sha256``,
+        ``records`` and ``downloaded``. Two consecutive calls into
+        different dest directories produce byte-identical manifests
+        (integration-test assertion d, Phase 1 share).
+        """
+        catalog = self._require_catalog()
+        info = catalog.query(
+            "SELECT catalog_sha256, n_records, predicate_sql FROM l4_cohort_snapshot "
+            "WHERE snapshot_id = ?",
+            params=[snapshot_id],
+        )
+        if info.empty:
+            raise KeyError(f"snapshot not found: {snapshot_id!r}")
+        meta = info.iloc[0].to_dict()
+
+        payload = load_snapshot_payload(catalog, snapshot_id)
+        dest_path = Path(dest) / snapshot_id
+        dest_path.mkdir(parents=True, exist_ok=True)
+
+        records: List[Dict[str, Any]] = []
+        downloaded: List[Dict[str, Any]] = []
+        if not payload.empty and "layer" in payload.columns:
+            l1 = payload[payload["layer"] == "l1_experiment"]
+            for _, row in l1.iterrows():
+                rec = {
+                    "record_uid": row["record_uid"],
+                    "dataset_id": row["dataset_id"],
+                    "dataset_version": row["dataset_version"],
+                    "subject_id": row["subject_id"],
+                    "study_id": row.get("study_id", ""),
+                }
+                records.append(rec)
+                if with_blobs:
+                    downloaded.extend(
+                        self._fetch_record_blobs(payload, rec, dest_path)
+                    )
+
+        manifest = {
+            "snapshot_id": snapshot_id,
+            "catalog_sha256": meta["catalog_sha256"],
+            "n_records": int(meta["n_records"]),
+            "predicate_sql": meta.get("predicate_sql"),
+            "miro_layout": "<dataset_id>/<subject_id>/image.nii.gz "
+            "+ seg/<label>.nii.gz + manifest.json",
+            "records": sorted(records, key=lambda r: r["record_uid"]),
+        }
+        manifest_path = dest_path / "manifest.json"
+        manifest_bytes = json.dumps(manifest, sort_keys=True, separators=(",", ":")).encode(
+            "utf-8"
+        )
+        manifest_path.write_bytes(manifest_bytes)
+
+        return {
+            "snapshot_id": snapshot_id,
+            "manifest_path": str(manifest_path),
+            "manifest_sha256": hashlib.sha256(manifest_bytes).hexdigest(),
+            "n_records": int(meta["n_records"]),
+            "catalog_sha256": meta["catalog_sha256"],
+            "records": records,
+            "downloaded": downloaded,
+        }
+
+    def _fetch_record_blobs(
+        self,
+        payload: pd.DataFrame,
+        record: Dict[str, Any],
+        dest_root: Path,
+    ) -> List[Dict[str, Any]]:
+        """Download (when MinIO is wired) raw/converted/mask blobs for *record*."""
+        results: List[Dict[str, Any]] = []
+        rec_uid = record["record_uid"]
+        subject_dir = (
+            dest_root
+            / str(record["dataset_id"])
+            / str(record["subject_id"])
+        )
+        subject_dir.mkdir(parents=True, exist_ok=True)
+
+        l2 = payload[(payload["layer"] == "l2_sensor") & (payload["record_uid"] == rec_uid)]
+        for _, row in l2.iterrows():
+            for col, sub in (("raw_uri", "image"), ("converted_uri", "image_converted")):
+                uri = row.get(col)
+                if not uri:
+                    continue
+                key = self._object_key_from_uri(uri)
+                if key is None:
+                    continue
+                local = subject_dir / f"{sub}_{row['modality']}_{row['sequence'] or 'na'}.nii.gz"
+                ok = self.minio_component.download_file(self.data_bucket, key, str(local))
+                results.append({"record_uid": rec_uid, "local_path": str(local), "success": ok})
+
+        l3 = payload[(payload["layer"] == "l3_annotation") & (payload["record_uid"] == rec_uid)]
+        seg_dir = subject_dir / "seg"
+        for _, row in l3.iterrows():
+            uri = row.get("mask_uri")
+            if not uri:
+                continue
+            key = self._object_key_from_uri(uri)
+            if key is None:
+                continue
+            seg_dir.mkdir(parents=True, exist_ok=True)
+            local = seg_dir / f"{row['label_canonical']}.nii.gz"
+            ok = self.minio_component.download_file(self.data_bucket, key, str(local))
+            results.append({"record_uid": rec_uid, "local_path": str(local), "success": ok})
+        return results
+
+    @staticmethod
+    def _object_key_from_uri(uri: str) -> Optional[str]:
+        """Return the object key of an ``s3://bucket/key`` URI, or None.
+
+        Non-string cells (None, NaN) and URIs with an empty key yield None.
+        """
+        if not isinstance(uri, str) or not uri.startswith("s3://"):
+            return None
+        _bucket, _sep, key = uri[len("s3://"):].partition("/")
+        return key or None
diff --git a/datorcloud/schemas/__init__.py b/datorcloud/schemas/__init__.py
new file mode 100644
index 0000000..09179a6
--- /dev/null
+++ b/datorcloud/schemas/__init__.py
@@ -0,0 +1,16 @@
+"""DatorCloud catalog schemas (L1-L4).
+
+This package owns the canonical L1-L4 DDL upstreamed in Phase 1 of the DORIS
+integration plan. It exposes:
+
+* :data:`L1_L4_DDL_PATH` - on-disk path to ``l1_l4.sql``.
+* :data:`SCHEMA_VERSION` - the version tag stamped into every catalog write.
+* :class:`Migration` - the idempotent migration runner that applies the DDL
+  to a DuckDB connection and computes a stable :attr:`schema_sha`.
+"""
+
+from __future__ import annotations
+
+from .migrations import Migration, SCHEMA_VERSION, L1_L4_DDL_PATH
+
+__all__ = ["Migration", "SCHEMA_VERSION", "L1_L4_DDL_PATH"]
diff --git a/datorcloud/schemas/l1_l4.sql b/datorcloud/schemas/l1_l4.sql
new file mode 100644
index 0000000..4e95c89
--- /dev/null
+++ b/datorcloud/schemas/l1_l4.sql
@@ -0,0 +1,211 @@
+-- =====================================================================
+-- DORIS L1-L4 catalog DDL (schema_version: 1.0.0)
+--
+-- Upstreamed into DatorCloud in Phase 1 of the DORIS integration plan
+-- (see msk-ai-trust-to-deploy/99_integration_plan/STEP_BY_STEP_PLAN.md §3).
+-- This file is the single source of truth for the layered catalog that the
+-- (I, C, Q, F) operators consume. Two design invariants are encoded here:
+--
+--   * L1 unique key includes ``study_id`` so DICOM rows with multiple
+--     studies per ``subject_id`` do not collide on ingest.
+--   * L2 (``l2_sensor``) is keyed by (record_uid, modality, sequence) so
+--     compound CVPR modality strings (e.g. ``"MR (T2, ADC)"``) split
+--     losslessly into one row per sequence -- no semicolon-delimited
+--     freeform strings in the catalog ever.
+--
+-- The DDL is idempotent: every CREATE statement is guarded with
+-- ``IF NOT EXISTS`` (DuckDB 1.2+) and is safe to re-run by the migration
+-- runner in ``schemas/migrations.py``. The migration runner hashes this
+-- file into ``schema_sha`` so two runs of an unchanged DDL emit identical
+-- hashes (integration-test gate ``doris-it-01-catalog`` assertion (a)).
+-- =====================================================================
+
+
+-- ---------------------------------------------------------------------
+-- Controlled vocabularies (ENUMs)
+-- ---------------------------------------------------------------------
+
+CREATE TYPE IF NOT EXISTS privacy_class AS ENUM (
+    'public',
+    'restricted',
+    'dua'
+);
+
+CREATE TYPE IF NOT EXISTS annotation_kind AS ENUM (
+    'manual',
+    'semi_automated',
+    'auto',
+    'reference'
+);
+
+-- ``instance_label`` distinguishes segmentation kinds so a single mask
+-- column can carry semantic, instance, or panoptic masks without
+-- per-dataset adapters guessing at runtime.
+CREATE TYPE IF NOT EXISTS instance_label AS ENUM (
+    'semantic',
+    'instance',
+    'panoptic',
+    'binary'
+);
+
+CREATE TYPE IF NOT EXISTS processing_stage AS ENUM (
+    'ingested',
+    'converted',
+    'qc_passed',
+    'failed',
+    'snapshotted'
+);
+
+
+-- ---------------------------------------------------------------------
+-- L1 - Experiment (administrative + provenance)
+-- ---------------------------------------------------------------------
+--
+-- One row per (dataset_id, dataset_version, subject_id, study_id) tuple.
+-- ``record_uid`` is the join key shared by L2 and L3. For non-DICOM rows
+-- ``study_id`` defaults to '' (empty string) which preserves a single
+-- row per subject; for DICOM rows the StudyInstanceUID is required to
+-- split multiple visits.
+CREATE TABLE IF NOT EXISTS l1_experiment (
+    record_uid              VARCHAR PRIMARY KEY,
+    dataset_id              VARCHAR NOT NULL,
+    dataset_version         VARCHAR NOT NULL,
+    subject_id              VARCHAR NOT NULL,
+    study_id                VARCHAR NOT NULL DEFAULT '',
+    cvpr_folder             VARCHAR,
+    body_part               VARCHAR[],
+    privacy_class           privacy_class NOT NULL,
+    license_spdx            VARCHAR NOT NULL,
+    license_rule_version    VARCHAR NOT NULL DEFAULT 'v0',
+    redistribution_ok       BOOLEAN NOT NULL,
+    hf_repo                 VARCHAR,
+    share_alike_obligation  BOOLEAN NOT NULL DEFAULT FALSE,
+    source_doi              VARCHAR,
+    source_url              VARCHAR,
+    ingested_at             TIMESTAMP NOT NULL DEFAULT CURRENT_TIMESTAMP,
+    UNIQUE (dataset_id, dataset_version, subject_id, study_id)
+);
+
+
+-- ---------------------------------------------------------------------
+-- L1 companion -- per-record citation list (DOIs/papers).
+-- ---------------------------------------------------------------------
+CREATE TABLE IF NOT EXISTS l1_citations (
+    record_uid VARCHAR NOT NULL,
+    doi        VARCHAR NOT NULL,
+    citation   VARCHAR NOT NULL,
+    PRIMARY KEY (record_uid, doi)
+);
+
+
+-- ---------------------------------------------------------------------
+-- L1 companion -- processing provenance for CVPR-style ingest.
+-- ---------------------------------------------------------------------
+--
+-- A single record may move through multiple stages (ingested -> converted
+-- -> qc_passed -> snapshotted). The table is append-only at the
+-- (record_uid, stage) grain; stage transitions are observed in lineage.
+CREATE TABLE IF NOT EXISTS l1_processing (
+    record_uid VARCHAR NOT NULL,
+    stage      processing_stage NOT NULL,
+    stage_at   TIMESTAMP NOT NULL DEFAULT CURRENT_TIMESTAMP,
+    runner     VARCHAR,
+    notes      VARCHAR,
+    PRIMARY KEY (record_uid, stage)
+);
+
+
+-- ---------------------------------------------------------------------
+-- L2 - Sensor (acquisition params + raw/converted blob URIs)
+-- ---------------------------------------------------------------------
+--
+-- Primary key (record_uid, modality, sequence) splits compound CVPR
+-- modality strings into one row per sequence: e.g. ``"MR (T2, ADC)"``
+-- becomes two rows -- (record_uid, 'MR', 'T2') and (record_uid, 'MR',
+-- 'ADC'). Non-sequence modalities (CT, US) carry sequence='' as a
+-- non-NULL sentinel so the unique constraint applies uniformly.
+--
+-- ``converted_uri`` is populated asynchronously by the
+-- raw->NIfTI/Zarr/etc conversion stage. Writes to it after the L4
+-- snapshot freeze do NOT mutate the snapshot's ``catalog_sha256``
+-- because snapshots deep-copy the L1-L3 payload at freeze time.
+CREATE TABLE IF NOT EXISTS l2_sensor (
+    record_uid          VARCHAR NOT NULL,
+    modality            VARCHAR NOT NULL,
+    sequence            VARCHAR NOT NULL DEFAULT '',
+    raw_format          VARCHAR NOT NULL,
+    raw_uri             VARCHAR,
+    converted_format    VARCHAR,
+    converted_uri       VARCHAR,
+    voxel_spacing_mm    DOUBLE[],
+    slice_thickness_mm  DOUBLE,
+    field_strength_t    DOUBLE,
+    scanner_model       VARCHAR,
+    PRIMARY KEY (record_uid, modality, sequence)
+);
+
+
+-- ---------------------------------------------------------------------
+-- L3 - Annotation (per-label, per-annotator)
+-- ---------------------------------------------------------------------
+--
+-- Multi-annotator support is built-in: the same (record_uid,
+-- label_canonical) pair may appear under multiple ``annotator`` values.
+-- ``label_canonical`` MUST resolve in config/msk_label_map.yaml (Phase 0
+-- gate); ``label_native`` preserves the adapter's raw string for audit.
+CREATE TABLE IF NOT EXISTS l3_annotation (
+    record_uid         VARCHAR NOT NULL,
+    label_canonical    VARCHAR NOT NULL,
+    annotator          VARCHAR NOT NULL DEFAULT 'unknown',
+    annotation_kind    annotation_kind NOT NULL,
+    instance_label     instance_label NOT NULL DEFAULT 'semantic',
+    label_native       VARCHAR,
+    mask_uri           VARCHAR,
+    annotation_method  VARCHAR,
+    PRIMARY KEY (record_uid, label_canonical, annotator)
+);
+
+
+-- ---------------------------------------------------------------------
+-- L4 - Cohort snapshot (frozen L1-L3 payload + catalog_sha256)
+-- ---------------------------------------------------------------------
+--
+-- A snapshot is an immutable freeze of the matched L1-L3 rows. The
+-- payload is stored as a single Parquet blob in ``l13_payload`` and
+-- hashed into ``catalog_sha256`` over a deterministic canonical
+-- serialisation -- so the same predicate against the same data always
+-- yields the same hash, even after asynchronous writes to
+-- ``l2_sensor.converted_uri`` (per STEP_BY_STEP_PLAN.md §3.4).
+--
+-- ``hf_publication_log`` is reserved for Phase 3 and remains NULL until
+-- DatorCloud's ``hf_publisher`` records a successful push.
+CREATE TABLE IF NOT EXISTS l4_cohort_snapshot (
+    snapshot_id          VARCHAR PRIMARY KEY,
+    created_at           TIMESTAMP NOT NULL DEFAULT CURRENT_TIMESTAMP,
+    predicate_sql        VARCHAR,
+    catalog_sha256       VARCHAR NOT NULL,
+    n_records            BIGINT  NOT NULL,
+    schema_version       VARCHAR NOT NULL DEFAULT '1.0.0',
+    l13_payload          BLOB    NOT NULL,
+    hf_publication_log   VARCHAR
+);
+
+
+-- ---------------------------------------------------------------------
+-- L4 - Evaluation set (multi-annotator GT layout per snapshot)
+-- ---------------------------------------------------------------------
+--
+-- Per design invariant I3 (snapshot ⟂ eval-set orthogonality), multiple
+-- eval sets may reference the same snapshot. Each row captures the
+-- annotator columns the inter-observer pipeline reads, the target
+-- labels to evaluate, and the two quantile cut-offs used to compute the
+-- IO band.
+CREATE TABLE IF NOT EXISTS l4_eval_set (
+    eval_set_id              VARCHAR PRIMARY KEY,
+    snapshot_id              VARCHAR NOT NULL REFERENCES l4_cohort_snapshot(snapshot_id),
+    annotator_columns        VARCHAR[] NOT NULL,
+    target_labels            VARCHAR[] NOT NULL,
+    inter_observer_quantiles DOUBLE[],
+    notes                    VARCHAR,
+    created_at               TIMESTAMP NOT NULL DEFAULT CURRENT_TIMESTAMP
+);
diff --git a/datorcloud/schemas/migrations.py b/datorcloud/schemas/migrations.py
new file mode 100644
index 0000000..58059cb
--- /dev/null
+++ b/datorcloud/schemas/migrations.py
@@ -0,0 +1,175 @@
+"""Idempotent DDL migration runner for the DORIS L1-L4 catalog.
+
+The migration runner reads ``l1_l4.sql`` and applies it to a DuckDB
+connection. Every statement in the DDL is guarded with ``IF NOT EXISTS``
+so re-running the migration is a no-op. The runner also exposes
+:attr:`schema_sha`, a SHA-256 digest of the *canonical* DDL source --
+two runs against the same checkout produce identical hashes, which is
+the gate ``doris-it-01-catalog`` assertion (a) checks.
+"""
+
+from __future__ import annotations
+
+import hashlib
+import logging
+import re
+from dataclasses import dataclass
+from pathlib import Path
+from typing import Iterable, Optional
+
+import duckdb
+
+log = logging.getLogger(__name__)
+
+# Schema version tag stamped into every catalog snapshot. Bump this when
+# the DDL changes in a way that requires re-running ``apply()``.
+SCHEMA_VERSION = "1.0.0"
+
+# On-disk path to the canonical DDL.
+L1_L4_DDL_PATH: Path = Path(__file__).resolve().parent / "l1_l4.sql"
+
+
+# ---------------------------------------------------------------------------
+# SQL splitting
+# ---------------------------------------------------------------------------
+
+
+def _strip_comments(text: str) -> str:
+    """Remove ``--`` line comments while preserving line numbers."""
+    out_lines = []
+    for line in text.splitlines():
+        # We do NOT strip comments inside string literals; the DDL does not
+        # use literal ``--`` inside any string.
+        idx = line.find("--")
+        if idx >= 0:
+            line = line[:idx]
+        out_lines.append(line)
+    return "\n".join(out_lines)
+
+
+def _split_statements(sql: str) -> list[str]:
+    """Split a SQL script into statements on bare ``;`` separators.
+
+    DuckDB accepts multiple statements per ``execute`` call only via the
+    streaming API in newer releases; for portability we split and submit
+    one at a time. The splitter ignores semicolons inside single-quoted
+    strings; our DDL has none today but we guard against future changes.
+    """
+    sql = _strip_comments(sql)
+    statements: list[str] = []
+    buf: list[str] = []
+    in_string = False
+    for ch in sql:
+        if ch == "'":
+            in_string = not in_string
+            buf.append(ch)
+        elif ch == ";" and not in_string:
+            stmt = "".join(buf).strip()
+            if stmt:
+                statements.append(stmt)
+            buf = []
+        else:
+            buf.append(ch)
+    tail = "".join(buf).strip()
+    if tail:
+        statements.append(tail)
+    return statements
+
+
+def _canonical_ddl_text(raw: str) -> str:
+    """Normalise the DDL text so the schema hash ignores cosmetic edits.
+
+    Strips comments, collapses whitespace inside each statement, and
+    re-joins on a single ``;\\n``. Two checkouts whose DDL differs only
+    in comments / whitespace produce identical ``schema_sha`` values.
+    """
+    stmts = _split_statements(raw)
+    return ";\n".join(re.sub(r"\s+", " ", s).strip() for s in stmts) + ";\n"
+
+
+# ---------------------------------------------------------------------------
+# Migration
+# ---------------------------------------------------------------------------
+
+
+@dataclass(frozen=True)
+class Migration:
+    """Apply ``l1_l4.sql`` to a DuckDB connection.
+
+    Usage
+    -----
+    >>> import duckdb
+    >>> from datorcloud.schemas import Migration
+    >>> conn = duckdb.connect(":memory:")
+    >>> m = Migration.from_path()
+    >>> _ = m.apply(conn)
+    >>> _ = m.apply(conn)        # idempotent: no error on a second call
+    >>> m.schema_sha             # doctest: +ELLIPSIS
+    '...'
+    """
+
+    ddl_text: str
+    schema_sha: str
+    schema_version: str = SCHEMA_VERSION
+
+    # ---- constructors -----------------------------------------------------
+
+    @classmethod
+    def from_path(cls, path: Optional[Path] = None) -> "Migration":
+        path = Path(path) if path is not None else L1_L4_DDL_PATH
+        text = path.read_text(encoding="utf-8")
+        return cls.from_text(text)
+
+    @classmethod
+    def from_text(cls, text: str) -> "Migration":
+        canonical = _canonical_ddl_text(text)
+        sha = hashlib.sha256(canonical.encode("utf-8")).hexdigest()
+        return cls(ddl_text=text, schema_sha=sha)
+
+    # ---- application ------------------------------------------------------
+
+    def statements(self) -> list[str]:
+        return _split_statements(self.ddl_text)
+
+    def apply(self, conn: "duckdb.DuckDBPyConnection") -> "MigrationResult":
+        """Apply the DDL to *conn*. Returns a result with statement counts."""
+        n_applied = 0
+        n_skipped = 0
+        for stmt in self.statements():
+            try:
+                conn.execute(stmt)
+                n_applied += 1
+            except duckdb.CatalogException as exc:
+                # Defensive: DuckDB ``CREATE TYPE IF NOT EXISTS`` works since
+                # 1.2 but older builds in the wild fall through to here. The
+                # net effect is identical -- type already exists.
+                msg = str(exc)
+                if "already exists" in msg:
+                    log.debug("skipping already-applied statement: %s", msg)
+                    n_skipped += 1
+                else:
+                    raise
+        return MigrationResult(
+            schema_sha=self.schema_sha,
+            schema_version=self.schema_version,
+            n_applied=n_applied,
+            n_skipped=n_skipped,
+        )
+
+
+@dataclass(frozen=True)
+class MigrationResult:
+    """Summary of one :meth:`Migration.apply` invocation."""
+
+    schema_sha: str
+    schema_version: str
+    n_applied: int
+    n_skipped: int
+
+
+__all__ = [
+    "Migration",
+    "MigrationResult",
+    "SCHEMA_VERSION",
+    "L1_L4_DDL_PATH",
+]
diff --git a/datorcloud/snapshots.py b/datorcloud/snapshots.py
new file mode 100644
index 0000000..20a8deb
--- /dev/null
+++ b/datorcloud/snapshots.py
@@ -0,0 +1,371 @@
+"""L4 cohort snapshot freeze + L4 eval-set creation.
+
+Per STEP_BY_STEP_PLAN.md §3 step 1.4, ``snapshot_cohort()`` is the moment
+where an immutable cohort identity is minted:
+
+* The matched L1-L3 rows are deep-copied into a single Parquet blob.
+* The blob is hashed (over a deterministic canonical serialisation) into
+  ``catalog_sha256``.
+* Both blob and hash are written into ``l4_cohort_snapshot``.
+
+The hash is stable under later asynchronous writes to
+``l2_sensor.converted_uri`` because it is computed over the frozen
+payload, not against the live tables. Integration test
+``doris-it-01-catalog`` assertion (c) is the system-level proof of this
+behaviour.
+
+Step 1.5 adds ``create_eval_set()`` on top: multiple eval sets may
+reference the same snapshot (design invariant I3).
+"""
+
+from __future__ import annotations
+
+import hashlib
+import io
+import json
+import logging
+from dataclasses import dataclass
+from datetime import date
+from typing import Optional, Sequence
+
+import duckdb
+import pandas as pd
+import pyarrow as pa
+import pyarrow.parquet as pq
+
+from .schemas import SCHEMA_VERSION
+
+log = logging.getLogger(__name__)
+
+
+# ---------------------------------------------------------------------------
+# Canonical serialisation
+# ---------------------------------------------------------------------------
+
+
+def _coerce_value(value):
+    """Normalise a single DataFrame cell to a JSON-safe Python value."""
+    # Missing-value singletons first: ``pd.NaT`` is not a ``pd.Timestamp``
+    # instance and ``pd.NA`` is not a float, so the type-specific branches
+    # below would pass them through and ``json.dumps`` would then fail.
+    if value is None or value is pd.NaT or value is pd.NA:
+        return None
+    # Bare floats can be NaN; pd.isna is only applied to scalars here.
+    # Lists must be checked element-wise (see below).
+    if isinstance(value, float):
+        return None if pd.isna(value) else value
+    if isinstance(value, pd.Timestamp):
+        return value.isoformat()
+    if isinstance(value, (bytes, bytearray)):
+        return bytes(value).hex()
+    if isinstance(value, list):
+        return [_coerce_value(v) for v in value]
+    if hasattr(value, "tolist") and not isinstance(value, str):
+        # e.g. numpy arrays / scalars: convert to plain Python, then recurse.
+        return _coerce_value(value.tolist())
+    return value
+
+
+def _canonical_json(df: pd.DataFrame) -> bytes:
+    """Serialise *df* to deterministic JSON bytes for hashing.
+
+    Rules:
+      * Columns are sorted alphabetically.
+      * Rows are sorted lexicographically using Python-level sort on the
+        coerced records (pandas ``sort_values`` cannot handle columns
+        that contain numpy arrays).
+      * NaN / NaT become ``null``; ``pd.Timestamp`` becomes its ISO 8601
+        string; ``bytes`` becomes base16; lists become JSON arrays.
+    """
+    if df.empty:
+        return b"[]"
+    sorted_cols = sorted(df.columns)
+    records = [
+        {k: _coerce_value(rec.get(k)) for k in sorted_cols}
+        for rec in df.to_dict(orient="records")
+    ]
+
+    def _sort_key(rec):
+        out = []
+        for col in sorted_cols:
+            v = rec[col]
+            if v is None:
+                # ``None`` sorts before anything else; encode as
+                # (0, "") so the comparison is total.
+                out.append((0, ""))
+            elif isinstance(v, list):
+                out.append((1, json.dumps(v, sort_keys=True, separators=(",", ":"))))
+            else:
+                out.append((1, _stringify_scalar(v)))
+        return tuple(out)
+
+    records.sort(key=_sort_key)
+    return json.dumps(records, sort_keys=True, separators=(",", ":")).encode("utf-8")
+
+
+def _stringify_scalar(value):
+    """Stringify a scalar for the canonical sort key.
+
+    Returns a type-tagged string (``b:`` bool, ``n:`` int/float, ``s:``
+    anything else) so mixed-type cells compare without TypeErrors.
+    """
+    if isinstance(value, bool):
+        return f"b:{int(value)}"
+    if isinstance(value, (int, float)):
+        return f"n:{value!r}"
+    return f"s:{value!s}"
+
+
+def _dataframe_to_parquet_blob(df: pd.DataFrame) -> bytes:
+    """Serialise *df* to a Parquet byte blob (storage format)."""
+    if df.empty:
+        return b""
+    table = pa.Table.from_pandas(df, preserve_index=False)
+    buf = io.BytesIO()
+    pq.write_table(
+        table,
+        buf,
+        version="2.6",
+        compression="snappy",
+        use_dictionary=True,
+        write_statistics=False,
+    )
+    return buf.getvalue()
+
+
+# ---------------------------------------------------------------------------
+# Public API
+# ---------------------------------------------------------------------------
+
+
+@dataclass(frozen=True)
+class Snapshot:
+    """The frozen identity of one cohort selection."""
+
+    snapshot_id: str
+    catalog_sha256: str
+    n_records: int
+    predicate_sql: Optional[str]
+    schema_version: str = SCHEMA_VERSION
+
+
+@dataclass(frozen=True)
+class EvalSet:
+    """A multi-annotator GT layout applied to one snapshot."""
+
+    eval_set_id: str
+    snapshot_id: str
+    annotator_columns: tuple[str, ...]
+    target_labels: tuple[str, ...]
+    inter_observer_quantiles: tuple[float, float] | None
+
+
+def _today_iso() -> str:
+    return date.today().isoformat()
+
+
+def _build_snapshot_payload(
+    conn: "duckdb.DuckDBPyConnection", predicate_sql: Optional[str]
+) -> pd.DataFrame:
+    """Run *predicate_sql* (or 'TRUE') against ``v_doris`` to get the matched rows.
+
+    The result is the denormalised view; we then attach the L3 annotation
+    rows in their original form (one row per (record_uid, label, annotator))
+    so the snapshot payload captures the full multi-annotator structure
+    that ``l4_eval_set`` later references.
+    """
+    where_clause = f"WHERE {predicate_sql}" if predicate_sql else ""
+    matched_uids = conn.execute(
+        f"SELECT DISTINCT record_uid FROM v_doris {where_clause}"
+    ).fetchdf()
+    if matched_uids.empty:
+        return matched_uids.assign(layer="empty")
+
+    # Build the layered payload: one DataFrame per layer, concatenated
+    # vertically with a 'layer' discriminator column. This keeps the
+    # canonical hash insensitive to layer-internal column ordering while
+    # preserving every annotator / sensor row.
+    uid_view = "_snapshot_uids"
+    conn.register(uid_view, matched_uids)
+    try:
+        l1 = conn.execute(
+            f"SELECT * FROM l1_experiment WHERE record_uid IN (SELECT record_uid FROM {uid_view})"
+        ).fetchdf()
+        l2 = conn.execute(
+            f"SELECT * FROM l2_sensor WHERE record_uid IN (SELECT record_uid FROM {uid_view})"
+        ).fetchdf()
+        l3 = conn.execute(
+            f"SELECT * FROM l3_annotation WHERE record_uid IN (SELECT record_uid FROM {uid_view})"
+        ).fetchdf()
+    finally:
+        conn.unregister(uid_view)
+
+    # We DROP ``l2_sensor.converted_uri`` and ``l1_experiment.ingested_at``
+    # from the canonical payload so later writes to them cannot perturb
+    # ``catalog_sha256``. The snapshot stores the *cohort identity*, not
+    # the conversion progress. ``converted_uri`` reappears in the live
+    # ``v_doris`` view and in ``F``-operator materialisations.
+    if "converted_uri" in l2.columns:
+        l2 = l2.drop(columns=["converted_uri"])
+    if "ingested_at" in l1.columns:
+        l1 = l1.drop(columns=["ingested_at"])
+
+    frames = []
+    for name, frame in (("l1_experiment", l1), ("l2_sensor", l2), ("l3_annotation", l3)):
+        if frame.empty:
+            continue
+        frame = frame.copy()
+        frame.insert(0, "layer", name)
+        frames.append(frame)
+    return pd.concat(frames, ignore_index=True, sort=False)
+
+
+def snapshot_cohort(
+    catalog,
+    *,
+    dataset_id: str,
+    predicate_sql: Optional[str] = None,
+    snapshot_date: Optional[str] = None,
+) -> Snapshot:
+    """Freeze a cohort identity into ``l4_cohort_snapshot``.
+
+    Args:
+        catalog: a :class:`ParquetCatalogComponent` (passed in to avoid an
+            import cycle).
+        dataset_id: logical cohort handle -- the part before ``@`` in the
+            ``<dataset_id>@<YYYY-MM-DD>`` snapshot id.
+        predicate_sql: optional SQL fragment evaluated against ``v_doris``
+            (e.g. ``"modality = 'CT' AND 'pelvis' = ANY(body_part)"``).
+            ``None`` means "all records currently in the catalog".
+        snapshot_date: ISO date string used for the snapshot id; defaults
+            to today. Tests pin this to a fixed date for determinism.
+
+    Returns:
+        The :class:`Snapshot` just written; a stored row with the same id is replaced.
+    """
+    iso = snapshot_date or _today_iso()
+    snapshot_id = f"{dataset_id}@{iso}"
+
+    conn = catalog.conn
+    payload = _build_snapshot_payload(conn, predicate_sql)
+    n_records = (
+        0
+        if payload.empty or "record_uid" not in payload.columns
+        else payload["record_uid"].nunique()
+    )
+
+    canonical = _canonical_json(payload)
+    catalog_sha = hashlib.sha256(canonical).hexdigest()
+    parquet_blob = _dataframe_to_parquet_blob(payload)
+
+    conn.execute(
+        """
+        INSERT OR REPLACE INTO l4_cohort_snapshot
+            (snapshot_id, created_at, predicate_sql, catalog_sha256,
+             n_records, schema_version, l13_payload, hf_publication_log)
+        VALUES (?, CURRENT_TIMESTAMP, ?, ?, ?, ?, ?, NULL)
+        """,
+        [snapshot_id, predicate_sql, catalog_sha, int(n_records), SCHEMA_VERSION, parquet_blob],
+    )
+
+    log.info(
+        "snapshot %s frozen: n_records=%d catalog_sha256=%s",
+        snapshot_id,
+        n_records,
+        catalog_sha,
+    )
+    return Snapshot(
+        snapshot_id=snapshot_id,
+        catalog_sha256=catalog_sha,
+        n_records=int(n_records),
+        predicate_sql=predicate_sql,
+    )
+
+
+def load_snapshot_payload(catalog, snapshot_id: str) -> pd.DataFrame:
+    """Return the frozen L1-L3 payload stored for *snapshot_id*.
+
+    The (F) operator and Phase 3's HF publisher both call this so that
+    downstream materialisation reads exactly the rows that were captured
+    at snapshot time -- never the live tables. Raises ``KeyError`` when
+    no such snapshot row exists; an empty/NULL blob gives an empty frame.
+    """
+    fetched = catalog.conn.execute(
+        "SELECT l13_payload FROM l4_cohort_snapshot WHERE snapshot_id = ?",
+        [snapshot_id],
+    ).fetchone()
+    if fetched is None:
+        raise KeyError(f"snapshot not found: {snapshot_id!r}")
+    (payload_blob,) = fetched
+    if payload_blob:
+        return pq.read_table(io.BytesIO(payload_blob)).to_pandas()
+    return pd.DataFrame()
+
+
+def create_eval_set(
+    catalog,
+    *,
+    eval_set_id: str,
+    snapshot_id: str,
+    annotator_columns: Sequence[str],
+    target_labels: Sequence[str],
+    inter_observer_quantiles: Sequence[float] | None = None,
+    notes: Optional[str] = None,
+) -> EvalSet:
+    """Attach a new ``l4_eval_set`` row to *snapshot_id*.
+
+    Per I3, the same ``snapshot_id`` may be referenced by multiple
+    ``eval_set_id`` values (different annotator subsets, different
+    inter-observer quantiles, etc.). The integration test asserts this.
+    Raises ``ValueError`` unless *inter_observer_quantiles* is ``None`` or
+    has two elements, and ``KeyError`` if *snapshot_id* is not stored.
+    """
+    if inter_observer_quantiles is not None and len(inter_observer_quantiles) != 2:
+        raise ValueError(
+            "inter_observer_quantiles must have exactly two elements "
+            f"[low, high]; got {list(inter_observer_quantiles)!r}"
+        )
+    # Test against None, not truthiness: array-likes raise on ``bool()``.
+    quantiles = None if inter_observer_quantiles is None else list(inter_observer_quantiles)
+
+    # Validate the snapshot exists -- DuckDB's REFERENCES would also catch
+    # this, but raising a KeyError here gives the caller a friendlier error.
+    exists = catalog.conn.execute(
+        "SELECT 1 FROM l4_cohort_snapshot WHERE snapshot_id = ?", [snapshot_id]
+    ).fetchone()
+    if exists is None:
+        raise KeyError(f"snapshot not found: {snapshot_id!r}")
+
+    catalog.conn.execute(
+        """
+        INSERT OR REPLACE INTO l4_eval_set
+            (eval_set_id, snapshot_id, annotator_columns, target_labels,
+             inter_observer_quantiles, notes, created_at)
+        VALUES (?, ?, ?, ?, ?, ?, CURRENT_TIMESTAMP)
+        """,
+        [
+            eval_set_id,
+            snapshot_id,
+            list(annotator_columns),
+            list(target_labels),
+            quantiles,
+            notes,
+        ],
+    )
+
+    return EvalSet(
+        eval_set_id=eval_set_id,
+        snapshot_id=snapshot_id,
+        annotator_columns=tuple(annotator_columns),
+        target_labels=tuple(target_labels),
+        inter_observer_quantiles=None if quantiles is None else tuple(quantiles),
+    )
+
+
+__all__ = [
+    "Snapshot",
+    "EvalSet",
+    "snapshot_cohort",
+    "create_eval_set",
+    "load_snapshot_payload",
+]
diff --git a/docs/snapshots.md b/docs/snapshots.md
new file mode 100644
index 0000000..786743c
--- /dev/null
+++ b/docs/snapshots.md
@@ -0,0 +1,138 @@
+# L4 cohort snapshots
+
+A **snapshot** is the immutable identity of one cohort selection. It
+captures every L1-L3 row that matched the selecting predicate at freeze
+time, hashes that frozen payload into `catalog_sha256`, and stores both
+the blob and the hash in `l4_cohort_snapshot`. The same predicate
+re-evaluated tomorrow against a mutated catalog will produce a
+**different** `snapshot_id` (and likely a different hash) -- that is the
+point. Two snapshots taken minutes apart against an unchanged catalog
+produce **identical** hashes -- also the point.
+
+This page describes the freeze semantics, the canonical serialisation
+rule, and the join surface that `l4_eval_set` exposes for the
+T2D inter-observer evaluation pipeline.
+
+## 1. Freeze semantics
+
+```python
+from datorcloud.snapshots import snapshot_cohort
+
+snap = snapshot_cohort(
+    catalog,
+    dataset_id="totalsegmentator",
+    predicate_sql="modality = 'CT' AND 'pelvis' = ANY(body_part)",
+    snapshot_date="2026-05-27",
+)
+print(snap.snapshot_id)        # totalsegmentator@2026-05-27
+print(snap.catalog_sha256)     # 64-character hex sha-256
+print(snap.n_records)          # number of distinct record_uids
+```
+
+Internally `snapshot_cohort()`:
+
+1. Evaluates `predicate_sql` against `v_doris` to enumerate the matching
+   `record_uid`s.
+2. Reads the full L1, L2, and L3 rows for those `record_uid`s into a
+   single long-format DataFrame with a `layer` discriminator column.
+3. Drops `l2_sensor.converted_uri` and `l1_experiment.ingested_at` from
+   the payload -- these are observability fields that may legitimately
+   mutate without altering the cohort identity (see §3 below).
+4. Computes `catalog_sha256` as the SHA-256 of the *canonical JSON*
+   serialisation of the payload (columns alphabetised, rows sorted
+   lexicographically, lists encoded as JSON arrays, timestamps in ISO
+   8601, NaN/NaT normalised to `null`).
+5. Serialises the same payload to a Parquet blob and writes
+   `(snapshot_id, created_at, predicate_sql, catalog_sha256, n_records,
+   schema_version, l13_payload)` into `l4_cohort_snapshot`;
+   `hf_publication_log` is stored as `NULL`, reserved for Phase 3.
+
+The Parquet blob is the storage format; the canonical JSON is what gets
+hashed. This split lets us optimise blob compression independently from
+the deterministic identity, and avoids the well-known PyArrow-version
+sensitivity of Parquet byte-level reproducibility.
+
+## 2. Reconstructing the payload
+
+```python
+from datorcloud.snapshots import load_snapshot_payload
+
+frozen = load_snapshot_payload(catalog, snap.snapshot_id)
+l1 = frozen[frozen["layer"] == "l1_experiment"]
+l3 = frozen[frozen["layer"] == "l3_annotation"]
+```
+
+The `(F)` operator (`DatorCloudOrchestrator.fetch`) and Phase 3's HF
+publisher both call `load_snapshot_payload` so downstream materialisation
+reads exactly the rows captured at snapshot time -- never the live
+tables. This is what guarantees the cross-tier identity gate in Phase 4
+(`build_cohort(source='hf').catalog_sha256 == build_cohort(source='minio').catalog_sha256`).
+
+## 3. Why `catalog_sha256` is insensitive to `converted_uri` writes
+
+After ingest, the raw -> NIfTI/Zarr conversion stage runs asynchronously
+and back-fills `l2_sensor.converted_uri` for each record. That URI is
+*provenance*, not *identity*: the same record converted on a different
+day still represents the same imaging examination.
+
+The snapshot freeze deliberately drops `converted_uri` from the
+canonical payload before hashing. Two snapshots of the same predicate
+-- one taken before the conversion stage runs, one taken after -- yield
+identical `catalog_sha256` values, which is exactly what assertion (c)
+of the `doris-it-01-catalog` gate verifies:
+
+```python
+first = snapshot_cohort(catalog, dataset_id="ts", snapshot_date=today)
+
+catalog.update_l2_converted_uri(
+    record_uid="u_s1000", modality="CT", sequence="",
+    converted_uri="s3://orx-datalake/ts/s1000/ct.zarr",
+)
+
+second = snapshot_cohort(catalog, dataset_id="ts", snapshot_date=today)
+assert first.catalog_sha256 == second.catalog_sha256
+```
+
+## 4. Eval-set orthogonality (design invariant I3)
+
+A snapshot is *what data* you selected. An eval set is *how you score
+it* (which annotator columns to consult, which labels to evaluate,
+which inter-observer quantiles to use). The two are independent: one
+snapshot may carry multiple eval sets.
+
+```python
+from datorcloud.snapshots import create_eval_set
+
+create_eval_set(
+    catalog,
+    eval_set_id="pelvis_femur_v3",
+    snapshot_id=snap.snapshot_id,
+    annotator_columns=["radiologist_a", "radiologist_b"],
+    target_labels=["femur_left", "femur_right"],
+    inter_observer_quantiles=[0.25, 0.75],
+)
+
+create_eval_set(
+    catalog,
+    eval_set_id="pelvis_femur_v3_q10_q90",
+    snapshot_id=snap.snapshot_id,            # same snapshot, different quantiles
+    annotator_columns=["radiologist_a", "radiologist_b"],
+    target_labels=["femur_left", "femur_right"],
+    inter_observer_quantiles=[0.1, 0.9],
+)
+```
+
+The Phase 5 evaluation pipeline joins
+`l4_eval_set -> l4_cohort_snapshot` to recover both the data identity
+(`catalog_sha256`) and the scoring layout in a single query. Assertion
+(f) of the integration-test gate `doris-it-05-evaluation` exercises
+exactly this join.
+
+## 5. Versioning
+
+The `schema_version` stamped into every `l4_cohort_snapshot` row is the
+DDL version from `datorcloud/schemas/__init__.py::SCHEMA_VERSION`. A
+breaking change to the L1-L4 DDL bumps the major component and forces
+a `catalog_sha256` recomputation for every downstream consumer. Per the
+plan, that has not happened since 1.0.0 and is not expected before v2
+of the integration plan.
diff --git a/pyproject.toml b/pyproject.toml
index 200d868..b85489d 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "datorcloud"
-version = "0.1.0"
+version = "0.2.0"
 description = "Modular, component-oriented framework for managing multimodal research data with MinIO and DuckDB."
 readme = "README.md"
 license = { text = "BSD-3-Clause" }
@@ -31,6 +31,7 @@ dependencies = [
     "minio>=7.1.15",
     "duckdb>=1.2.0",
     "pandas>=1.5.3",
+    "pyarrow>=14.0",
     "python-dotenv>=1.0.0",
 ]
 
@@ -66,6 +67,9 @@ Author = "https://github.com/jagh"
 include = ["datorcloud*"]
 exclude = ["tests*", "examples*", "build*", "docs*", "src*"]
 
+[tool.setuptools.package-data]
+"datorcloud.schemas" = ["*.sql"]
+
 [tool.pytest.ini_options]
 minversion = "7.0"
 testpaths = ["tests"]
@@ -73,6 +77,9 @@ addopts = "-ra"
 filterwarnings = [
     "ignore::DeprecationWarning",
 ]
+markers = [
+    "integration: end-to-end DORIS integration tests (doris-it-XX)",
+]
 
 [tool.ruff]
 line-length = 100
diff --git a/tests/integration/__init__.py b/tests/integration/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/tests/integration/test_01_catalog.py b/tests/integration/test_01_catalog.py
new file mode 100644
index 0000000..f912387
--- /dev/null
+++ b/tests/integration/test_01_catalog.py
@@ -0,0 +1,290 @@
+"""``doris-it-01-catalog`` -- Phase 1 integration test.
+
+Per STEP_BY_STEP_PLAN.md §3 the test runs the full
+``ingest -> query -> snapshot -> fetch -> eval_set`` path against a
+synthetic 5-subject TotalSegmentator v2 slice (``it_ts_5subj``). It is
+the system-level proof that:
+
+  (a) the DDL migration is idempotent (``schema_sha`` stable across two
+      runs),
+  (b) ``count(*) FROM l1_experiment WHERE dataset_id = 'totalsegmentator'``
+      equals 5 after ingest,
+  (c) the snapshot's ``catalog_sha256`` is identical on rerun, even after
+      ``l2_sensor.converted_uri`` is filled in between,
+  (d) ``fetch(snapshot_id=...)`` writes a byte-identical MIRO manifest on
+      rerun,
+  (e) two ``l4_eval_set`` rows pointing to the same ``snapshot_id`` are
+      legal,
+  (f) the ``Q`` operator returns the same rows whether queried through
+      raw DuckDB SQL or the wrapper API.
+
+This test runs entirely in-process: DuckDB in-memory, the parquet
+catalog rooted at ``tmp_path``, no MinIO, no GPU. The Phase 1 budget is
+under 60 seconds; on a stock laptop it completes in well under one.
+"""
+
+from __future__ import annotations
+
+from pathlib import Path
+
+import duckdb
+import pandas as pd
+import pytest
+
+from datorcloud.components.parquet_catalog_component import ParquetCatalogComponent
+from datorcloud.core import DatorCloudOrchestrator
+from datorcloud.schemas import Migration
+from datorcloud.snapshots import (
+    create_eval_set,
+    load_snapshot_payload,
+    snapshot_cohort,
+)
+
+pytestmark = pytest.mark.integration
+
+DATASET_ID = "totalsegmentator"
+DATASET_VERSION = "v2"
+SNAPSHOT_DATE = "2026-05-27"
+
+
+# ---------------------------------------------------------------------------
+# 5-subject TS slice fixture
+# ---------------------------------------------------------------------------
+
+
+def _it_ts_5subj() -> tuple[pd.DataFrame, pd.DataFrame, pd.DataFrame]:
+    """Synthetic stand-in for the on-disk ``it_ts_5subj`` fixture.
+
+    Five TS-v2 subjects with one CT volume each and two annotated
+    structures (``femur_left`` / ``femur_right``). Designed to validate
+    every assertion in the test plan without touching the network.
+    """
+    subjects = [f"s{1000 + i:04d}" for i in range(5)]
+
+    l1 = pd.DataFrame(
+        [
+            {
+                "record_uid": f"u_{sid}",
+                "dataset_id": DATASET_ID,
+                "dataset_version": DATASET_VERSION,
+                "subject_id": sid,
+                "study_id": "",
+                "cvpr_folder": None,
+                "body_part": ["pelvis"] if i % 2 == 0 else ["abdomen"],
+                "privacy_class": "public",
+                "license_spdx": "CC-BY-4.0",
+                "license_rule_version": "v1",
+                "redistribution_ok": True,
+                "hf_repo": "bal-dmu/msk-imaging",
+                "share_alike_obligation": False,
+                "source_doi": "10.5281/zenodo.10047292",
+                "source_url": "https://zenodo.org/record/10047292",
+            }
+            for i, sid in enumerate(subjects)
+        ]
+    )
+
+    l2 = pd.DataFrame(
+        [
+            {
+                "record_uid": f"u_{sid}",
+                "modality": "CT",
+                "sequence": "",
+                "raw_format": "nii.gz",
+                "raw_uri": f"s3://orx-datalake/{DATASET_ID}/{sid}/ct.nii.gz",
+                "voxel_spacing_mm": [1.5, 1.5, 1.5],
+                "slice_thickness_mm": 1.5,
+            }
+            for sid in subjects
+        ]
+    )
+
+    l3 = pd.DataFrame(
+        [
+            {
+                "record_uid": f"u_{sid}",
+                "label_canonical": label,
+                "annotator": "ts_v2",
+                "annotation_kind": "auto",
+                "instance_label": "semantic",
+                "mask_uri": f"s3://orx-datalake/{DATASET_ID}/{sid}/seg/{label}.nii.gz",
+            }
+            for sid in subjects
+            for label in ("femur_left", "femur_right")
+        ]
+    )
+
+    return l1, l2, l3
+
+
+# ---------------------------------------------------------------------------
+# Fixtures
+# ---------------------------------------------------------------------------
+
+
+@pytest.fixture
+def orchestrator(tmp_path) -> DatorCloudOrchestrator:
+    """A catalog-only orchestrator (no MinIO / no httpfs S3 in this path)."""
+    catalog = ParquetCatalogComponent(metadata_base_uri=str(tmp_path / "catalog"))
+    from datorcloud.components.minio_component import MinioObjectComponent
+    from datorcloud.components.query_component import QueryComponent
+
+    class _NoopClient:
+        def bucket_exists(self, bucket): return True
+        def make_bucket(self, bucket): return None
+        def fput_object(self, *a, **kw): return None
+        def fget_object(self, *a, **kw): return None
+
+    minio = MinioObjectComponent(client=_NoopClient())
+    # QueryComponent built around the same DuckDB connection so the
+    # legacy (Q) path and the new catalog views see the same state.
+    qc = QueryComponent.__new__(QueryComponent)
+    qc.conn = catalog.conn
+    return DatorCloudOrchestrator(
+        minio_component=minio,
+        query_component=qc,
+        parquet_catalog=catalog,
+        local_download_dir=str(tmp_path / "out"),
+    )
+
+
+@pytest.fixture
+def seeded_orchestrator(orchestrator: DatorCloudOrchestrator) -> DatorCloudOrchestrator:
+    l1, l2, l3 = _it_ts_5subj()
+    orchestrator.ingest("l1_experiment", l1)
+    orchestrator.ingest("l2_sensor", l2)
+    orchestrator.ingest("l3_annotation", l3)
+    return orchestrator
+
+
+# ---------------------------------------------------------------------------
+# Assertions
+# ---------------------------------------------------------------------------
+
+
+def test_a_ddl_migration_is_idempotent() -> None:
+    """Assertion (a): ``schema_sha`` is stable across two runs."""
+    conn = duckdb.connect(":memory:")
+    m = Migration.from_path()
+    sha1 = m.apply(conn).schema_sha
+    sha2 = m.apply(conn).schema_sha
+    assert sha1 == sha2
+
+
+def test_b_ingest_produces_expected_l1_count(
+    seeded_orchestrator: DatorCloudOrchestrator,
+) -> None:
+    """Assertion (b): 5 L1 rows after ingest."""
+    df = seeded_orchestrator.query(
+        sql=f"SELECT count(*) AS n FROM l1_experiment "
+        f"WHERE dataset_id = '{DATASET_ID}'"
+    )
+    assert int(df.iloc[0]["n"]) == 5
+
+
+def test_c_snapshot_sha_stable_across_converted_uri_writes(
+    seeded_orchestrator: DatorCloudOrchestrator,
+) -> None:
+    """Assertion (c): catalog_sha256 unchanged after async conversion writes."""
+    first = seeded_orchestrator.snapshot_cohort(
+        dataset_id=DATASET_ID, snapshot_date=SNAPSHOT_DATE
+    )
+    # Async conversion stage updates converted_uri on every L2 row.
+    for i in range(5):
+        seeded_orchestrator.parquet_catalog.update_l2_converted_uri(
+            record_uid=f"u_s{1000 + i:04d}",
+            modality="CT",
+            sequence="",
+            converted_uri=f"s3://orx-datalake/{DATASET_ID}/s{1000 + i:04d}/ct.zarr",
+        )
+    second = seeded_orchestrator.snapshot_cohort(
+        dataset_id=DATASET_ID, snapshot_date=SNAPSHOT_DATE
+    )
+    assert first.catalog_sha256 == second.catalog_sha256
+    assert first.n_records == 5 == second.n_records
+
+
+def test_d_fetch_writes_byte_identical_manifest(
+    seeded_orchestrator: DatorCloudOrchestrator, tmp_path
+) -> None:
+    """Assertion (d): two fetches produce byte-identical MIRO manifests."""
+    snap = seeded_orchestrator.snapshot_cohort(
+        dataset_id=DATASET_ID, snapshot_date=SNAPSHOT_DATE
+    )
+    out_a = seeded_orchestrator.fetch(snapshot_id=snap.snapshot_id, dest=str(tmp_path / "fa"))
+    out_b = seeded_orchestrator.fetch(snapshot_id=snap.snapshot_id, dest=str(tmp_path / "fb"))
+    assert out_a["manifest_sha256"] == out_b["manifest_sha256"]
+    assert out_a["catalog_sha256"] == out_b["catalog_sha256"] == snap.catalog_sha256
+    assert Path(out_a["manifest_path"]).exists()
+    assert Path(out_b["manifest_path"]).exists()
+    assert (
+        Path(out_a["manifest_path"]).read_bytes()
+        == Path(out_b["manifest_path"]).read_bytes()
+    )
+
+
+def test_e_two_eval_sets_share_one_snapshot(
+    seeded_orchestrator: DatorCloudOrchestrator,
+) -> None:
+    """Assertion (e): multiple eval sets per snapshot is legal."""
+    snap = seeded_orchestrator.snapshot_cohort(
+        dataset_id=DATASET_ID, snapshot_date=SNAPSHOT_DATE
+    )
+    seeded_orchestrator.create_eval_set(
+        eval_set_id="es_femur",
+        snapshot_id=snap.snapshot_id,
+        annotator_columns=["ts_v2"],
+        target_labels=["femur_left", "femur_right"],
+        inter_observer_quantiles=[0.25, 0.75],
+    )
+    seeded_orchestrator.create_eval_set(
+        eval_set_id="es_femur_left_only",
+        snapshot_id=snap.snapshot_id,
+        annotator_columns=["ts_v2"],
+        target_labels=["femur_left"],
+        inter_observer_quantiles=[0.1, 0.9],
+    )
+    rows = seeded_orchestrator.query(
+        sql=f"SELECT eval_set_id FROM l4_eval_set WHERE snapshot_id = '{snap.snapshot_id}'"
+    )
+    assert set(rows["eval_set_id"]) == {"es_femur", "es_femur_left_only"}
+
+
+def test_f_q_operator_matches_raw_sql(
+    seeded_orchestrator: DatorCloudOrchestrator,
+) -> None:
+    """Assertion (f): the wrapper Q API returns the same rows as raw SQL."""
+    via_wrapper = seeded_orchestrator.query(
+        view="v_doris", filters={"modality": "CT"}
+    )
+    via_sql = seeded_orchestrator.query(
+        sql="SELECT * FROM v_doris WHERE modality = 'CT'"
+    )
+    assert len(via_wrapper) == len(via_sql) == 5
+    assert sorted(via_wrapper["record_uid"]) == sorted(via_sql["record_uid"])
+
+
+def test_full_chain_summary(
+    seeded_orchestrator: DatorCloudOrchestrator, tmp_path
+) -> None:
+    """A second pass over the same orchestrator -- ingest is idempotent,
+    snapshot SHA stable, payload reconstructs."""
+    l1, l2, l3 = _it_ts_5subj()
+    # Re-ingest the same rows: counts must not double.
+    seeded_orchestrator.ingest("l1_experiment", l1)
+    seeded_orchestrator.ingest("l2_sensor", l2)
+    seeded_orchestrator.ingest("l3_annotation", l3)
+    df = seeded_orchestrator.query(
+        sql=f"SELECT count(*) AS n FROM l1_experiment WHERE dataset_id = '{DATASET_ID}'"
+    )
+    assert int(df.iloc[0]["n"]) == 5
+
+    snap = seeded_orchestrator.snapshot_cohort(
+        dataset_id=DATASET_ID, snapshot_date=SNAPSHOT_DATE
+    )
+    payload = load_snapshot_payload(seeded_orchestrator.parquet_catalog, snap.snapshot_id)
+    assert {"l1_experiment", "l2_sensor", "l3_annotation"} <= set(payload["layer"])
+
+    fetch = seeded_orchestrator.fetch(snapshot_id=snap.snapshot_id, dest=str(tmp_path / "final"))
+    assert fetch["n_records"] == 5
+    assert len(fetch["records"]) == 5
diff --git a/tests/test_cli.py b/tests/test_cli.py
index ffe08e8..796971c 100644
--- a/tests/test_cli.py
+++ b/tests/test_cli.py
@@ -33,3 +33,63 @@ def test_parse_kv_pairs_basic():
 
 def test_parse_filters_basic():
     assert cli._parse_filters(["camera_id=camera01"]) == {"camera_id": "camera01"}
+
+
+def test_cli_query_sql_against_local_catalog(tmp_path, capsys, monkeypatch):
+    """Phase 1 §3 step 1.3 CLI gate.
+
+    ``python -m datorcloud query --sql "SELECT count(*) FROM v_doris"``
+    must work end-to-end against a freshly-seeded local catalog without
+    requiring MinIO credentials.
+    """
+    catalog_dir = tmp_path / "catalog"
+    # Pre-seed the catalog with one L1 row so the count is non-zero and
+    # the test catches breakages in the wiring rather than a no-op pass.
+    from datorcloud.components.parquet_catalog_component import ParquetCatalogComponent
+    import pandas as pd
+
+    cat = ParquetCatalogComponent(metadata_base_uri=str(catalog_dir))
+    cat.write_rows(
+        "l1_experiment",
+        pd.DataFrame(
+            [
+                {
+                    "record_uid": "u1",
+                    "dataset_id": "totalsegmentator",
+                    "dataset_version": "v2",
+                    "subject_id": "s0011",
+                    "study_id": "",
+                    "privacy_class": "public",
+                    "license_spdx": "CC-BY-4.0",
+                    "redistribution_ok": True,
+                    "license_rule_version": "v1",
+                    "share_alike_obligation": False,
+                }
+            ]
+        ),
+    )
+    # The CLI builds a fresh orchestrator that points at the same
+    # ``catalog_base_uri`` directory. We pass the catalog through a
+    # monkeypatched factory so both orchestrators share state.
+    real_build = cli._build_orchestrator
+
+    def fake_build(args, *, require_minio=True):
+        orch = real_build(args, require_minio=require_minio)
+        orch.parquet_catalog = cat
+        return orch
+
+    monkeypatch.setattr(cli, "_build_orchestrator", fake_build)
+
+    rc = cli.main(
+        [
+            "query",
+            "--sql",
+            "SELECT count(*) AS n FROM v_doris",
+            "--catalog-base-uri",
+            str(catalog_dir),
+        ]
+    )
+    captured = capsys.readouterr()
+    assert rc == 0
+    # CSV output: "n\n1\n"
+    assert "1" in captured.out
diff --git a/tests/test_eval_set_join.py b/tests/test_eval_set_join.py
new file mode 100644
index 0000000..22a3f52
--- /dev/null
+++ b/tests/test_eval_set_join.py
@@ -0,0 +1,101 @@
+"""Phase 1 step 1.5 gate: multiple eval sets reference the same snapshot.
+
+This is design invariant I3 (snapshot ⟂ eval-set orthogonality) at the
+SQL layer: the join from ``l4_eval_set`` back to its parent
+``l4_cohort_snapshot`` must support an N:1 relationship.
+"""
+
+from __future__ import annotations
+
+import pandas as pd
+import pytest
+
+from datorcloud.components.parquet_catalog_component import ParquetCatalogComponent
+from datorcloud.snapshots import create_eval_set, snapshot_cohort
+
+
+@pytest.fixture
+def catalog(tmp_path) -> ParquetCatalogComponent:
+    return ParquetCatalogComponent(metadata_base_uri=str(tmp_path / "catalog"))
+
+
+def _seed(catalog: ParquetCatalogComponent) -> str:
+    catalog.write_rows(
+        "l1_experiment",
+        pd.DataFrame(
+            [
+                {
+                    "record_uid": "u1",
+                    "dataset_id": "ts",
+                    "dataset_version": "v2",
+                    "subject_id": "s1",
+                    "study_id": "",
+                    "privacy_class": "public",
+                    "license_spdx": "CC-BY-4.0",
+                    "redistribution_ok": True,
+                    "license_rule_version": "v1",
+                    "share_alike_obligation": False,
+                }
+            ]
+        ),
+    )
+    snap = snapshot_cohort(catalog, dataset_id="ts", snapshot_date="2026-05-27")
+    return snap.snapshot_id
+
+
+def test_two_eval_sets_share_one_snapshot(catalog: ParquetCatalogComponent) -> None:
+    sid = _seed(catalog)
+    create_eval_set(
+        catalog,
+        eval_set_id="es_pelvis",
+        snapshot_id=sid,
+        annotator_columns=["radiologist_a", "radiologist_b"],
+        target_labels=["femur_left"],
+        inter_observer_quantiles=[0.25, 0.75],
+    )
+    create_eval_set(
+        catalog,
+        eval_set_id="es_shoulder",
+        snapshot_id=sid,
+        annotator_columns=["radiologist_c", "radiologist_d"],
+        target_labels=["femur_right"],
+        inter_observer_quantiles=[0.1, 0.9],
+    )
+
+    rows = catalog.query("SELECT eval_set_id, snapshot_id FROM l4_eval_set ORDER BY eval_set_id")
+    assert len(rows) == 2
+    assert set(rows["snapshot_id"]) == {sid}  # both reference the same snapshot
+    assert set(rows["eval_set_id"]) == {"es_pelvis", "es_shoulder"}
+
+
+def test_eval_set_join_to_snapshot(catalog: ParquetCatalogComponent) -> None:
+    sid = _seed(catalog)
+    create_eval_set(
+        catalog,
+        eval_set_id="es_a",
+        snapshot_id=sid,
+        annotator_columns=["a"],
+        target_labels=["femur_left"],
+    )
+    joined = catalog.query(
+        """
+        SELECT es.eval_set_id, cs.snapshot_id, cs.n_records, cs.catalog_sha256
+          FROM l4_eval_set es
+          JOIN l4_cohort_snapshot cs USING (snapshot_id)
+         ORDER BY es.eval_set_id
+        """
+    )
+    assert len(joined) == 1
+    assert joined.iloc[0]["snapshot_id"] == sid
+    assert joined.iloc[0]["n_records"] == 1
+
+
+def test_eval_set_rejects_unknown_snapshot(catalog: ParquetCatalogComponent) -> None:
+    with pytest.raises(KeyError):
+        create_eval_set(
+            catalog,
+            eval_set_id="orphan",
+            snapshot_id="ghost@2026-05-27",
+            annotator_columns=["a"],
+            target_labels=["femur_left"],
+        )
diff --git a/tests/test_parquet_catalog_component.py b/tests/test_parquet_catalog_component.py
new file mode 100644
index 0000000..7676755
--- /dev/null
+++ b/tests/test_parquet_catalog_component.py
@@ -0,0 +1,215 @@
+"""Phase 1 step 1.2 gate: ``ParquetCatalogComponent`` end-to-end behaviour.
+
+Asserts:
+  * the DDL is applied on construction,
+  * ``v_doris`` and ``v_doris_egress`` views exist and respect the
+    license / privacy filter,
+  * round-trip writes land in the in-memory tables,
+  * ``materialize_parquet`` produces the hive layout
+    ``<base>/<layer>/dataset_id=<id>/dataset_version=<v>/part.parquet``
+    for L1-L3 layers and a flat file for L4 layers,
+  * the materialised files can be queried via ``read_parquet``
+    with hive partitioning.
+"""
+
+from __future__ import annotations
+
+from pathlib import Path
+
+import duckdb
+import pandas as pd
+import pytest
+
+from datorcloud.components.parquet_catalog_component import (
+    ParquetCatalogComponent,
+    HIVE_PARTITIONED_LAYERS,
+)
+
+
+def _sample_l1(record_uid: str = "u1", privacy: str = "public") -> pd.DataFrame:
+    """Return a one-row ``l1_experiment`` frame keyed by ``record_uid``."""
+    row = {
+        "record_uid": record_uid,
+        "dataset_id": "totalsegmentator",
+        "dataset_version": "v2",
+        # Derived from the uid, so distinct uids yield distinct subjects.
+        "subject_id": f"s{record_uid}",
+        "study_id": "",
+        # Caller-selected; the egress-view test passes "dua" here.
+        "privacy_class": privacy,
+        "license_spdx": "CC-BY-4.0",
+        "redistribution_ok": True,
+        "license_rule_version": "v1",
+        "share_alike_obligation": False,
+    }
+    return pd.DataFrame([row])
+
+
+def _sample_l2(record_uid: str = "u1", sequence: str = "") -> pd.DataFrame:
+    """Return a one-row CT ``l2_sensor`` frame for ``record_uid``."""
+    # Only the raw location is filled in; the row carries no ``converted_uri``.
+    raw_uri = f"s3://orx-datalake/totalsegmentator/{record_uid}/ct.nii.gz"
+    row = {
+        "record_uid": record_uid,
+        "modality": "CT",
+        "sequence": sequence,
+        "raw_format": "nii.gz",
+        "raw_uri": raw_uri,
+    }
+    return pd.DataFrame([row])
+
+
+def _sample_l3(record_uid: str = "u1", label: str = "femur_left") -> pd.DataFrame:
+    """Return a one-row ``l3_annotation`` frame labelling ``record_uid``."""
+    # The mask path embeds both the record uid and the label name.
+    mask_uri = f"s3://orx-datalake/totalsegmentator/{record_uid}/seg/{label}.nii.gz"
+    row = {
+        "record_uid": record_uid,
+        "label_canonical": label,
+        "annotator": "ts_v2",
+        "annotation_kind": "auto",
+        "instance_label": "semantic",
+        "mask_uri": mask_uri,
+    }
+    return pd.DataFrame([row])
+
+
+@pytest.fixture  # default (function) scope: each test builds its own catalog
+def catalog(tmp_path: Path) -> ParquetCatalogComponent:
+    return ParquetCatalogComponent(metadata_base_uri=str(tmp_path / "catalog"))
+
+
+# ---------------------------------------------------------------------------
+# Construction / DDL surface
+# ---------------------------------------------------------------------------
+
+
+def test_ddl_applied_on_construction(catalog: ParquetCatalogComponent) -> None:
+    """The core table of every layer exists as soon as the component is built."""
+    listing_sql = (
+        "SELECT table_name FROM information_schema.tables "
+        "WHERE table_type = 'BASE TABLE'"
+    )
+    present = {name for (name,) in catalog.conn.execute(listing_sql).fetchall()}
+    assert {"l1_experiment", "l2_sensor", "l3_annotation", "l4_cohort_snapshot"} <= present
+
+
+def test_views_exist(catalog: ParquetCatalogComponent) -> None:
+    """Both canonical views are registered on the component's connection."""
+    view_rows = catalog.conn.execute(
+        "SELECT table_name FROM information_schema.views"
+    ).fetchall()
+    view_names = {name for (name,) in view_rows}
+    # v_doris is the full view; v_doris_egress is its license/privacy-filtered twin.
+    for expected in ("v_doris", "v_doris_egress"):
+        assert expected in view_names
+
+
+def test_schema_sha_set(catalog: ParquetCatalogComponent) -> None:
+    digest = catalog.schema_sha  # must already be set once the fixture returns
+    assert digest and len(digest) == 64  # non-empty and 64 characters long
+
+
+# ---------------------------------------------------------------------------
+# Write / query round-trip
+# ---------------------------------------------------------------------------
+
+
+def test_write_rows_round_trip(catalog: ParquetCatalogComponent) -> None:
+    """Rows written to L1-L3 surface as a single joined ``v_doris`` record."""
+    catalog.write_rows("l1_experiment", _sample_l1())
+    catalog.write_rows("l2_sensor", _sample_l2())
+    catalog.write_rows("l3_annotation", _sample_l3())
+    joined = catalog.query("SELECT * FROM v_doris")
+    assert len(joined) == 1
+    record = joined.iloc[0]
+    assert (record["record_uid"], record["modality"]) == ("u1", "CT")
+    # list() normalises whatever sequence type the view returns for ``labels``.
+    assert "femur_left" in list(record["labels"])
+
+
+def test_v_doris_egress_filters_dua(catalog: ParquetCatalogComponent) -> None:
+    """A non-redistributable DUA record shows in ``v_doris`` but not in egress."""
+    restricted = _sample_l1("u_dua", "dua").assign(redistribution_ok=False)
+    for frame in (_sample_l1("u_public", "public"), restricted):
+        catalog.write_rows("l1_experiment", frame)
+
+    egress_uids = set(catalog.query("SELECT record_uid FROM v_doris_egress")["record_uid"])
+    all_uids = set(catalog.query("SELECT record_uid FROM v_doris")["record_uid"])
+    # Only the public record may leave; the unfiltered view still lists both.
+    assert egress_uids == {"u_public"}
+    assert all_uids == {"u_public", "u_dua"}
+
+
+def test_update_l2_converted_uri(catalog: ParquetCatalogComponent) -> None:
+    """``update_l2_converted_uri`` stores the new URI on the matching L2 row."""
+    zarr_uri = "s3://orx-datalake/totalsegmentator/u1/ct.zarr"
+    catalog.write_rows("l1_experiment", _sample_l1())
+    catalog.write_rows("l2_sensor", _sample_l2())
+    # The target row is selected by record_uid, modality and sequence.
+    catalog.update_l2_converted_uri(
+        record_uid="u1", modality="CT", sequence="", converted_uri=zarr_uri
+    )
+    stored = catalog.query("SELECT converted_uri FROM l2_sensor")["converted_uri"].iloc[0]
+    assert stored.endswith("ct.zarr")
+
+
+def test_write_rows_rejects_unknown_layer(catalog: ParquetCatalogComponent) -> None:
+    with pytest.raises(ValueError):  # a name that is not a catalog layer must be refused
+        catalog.write_rows("not_a_layer", pd.DataFrame([{"x": 1}]))
+
+
+# ---------------------------------------------------------------------------
+# Parquet materialisation -- hive layout
+# ---------------------------------------------------------------------------
+
+
+def test_materialize_parquet_hive_layout(catalog: ParquetCatalogComponent, tmp_path) -> None:
+    """Each L1-L3 layer materialises under dataset_id/dataset_version directories."""
+    catalog.write_rows("l1_experiment", _sample_l1())
+    catalog.write_rows("l2_sensor", _sample_l2())
+    catalog.write_rows("l3_annotation", _sample_l3())
+    written = catalog.materialize_parquet()
+    for layer in ("l1_experiment", "l2_sensor", "l3_annotation"):
+        assert written[layer], f"no files written for {layer}"
+        first_file = Path(written[layer][0])
+        location = first_file.as_posix()
+        assert "dataset_id=totalsegmentator" in location
+        assert "dataset_version=v2" in location
+        assert first_file.exists() and layer in HIVE_PARTITIONED_LAYERS
+
+
+def test_materialised_parquet_reads_back_with_hive_partitioning(
+    catalog: ParquetCatalogComponent, tmp_path
+) -> None:
+    """Materialised L1 files round-trip through a fresh DuckDB session."""
+    catalog.write_rows("l1_experiment", _sample_l1())
+    catalog.materialize_parquet()
+    # read_parquet(..., hive_partitioning=true) is the protocol the Phase 4
+    # HF httpfs reads also rely on, so it must recover the partition columns.
+    base = Path(catalog.metadata_base_uri) / "l1_experiment"
+    glob = (base / "**" / "*.parquet").as_posix()
+    # Context manager closes the throwaway connection even if the query fails.
+    with duckdb.connect(":memory:") as conn:
+        df = conn.execute(
+            f"SELECT * FROM read_parquet('{glob}', hive_partitioning=true)"
+        ).fetchdf()
+    assert not df.empty, "no rows read back from the materialised parquet files"
+    assert {"dataset_id", "dataset_version"} <= set(df.columns)
+    assert df.iloc[0]["dataset_id"] == "totalsegmentator"
+    assert df.iloc[0]["dataset_version"] == "v2"
+
+
+def test_l4_materialises_flat(catalog: ParquetCatalogComponent) -> None:
+    """L4 snapshot tables materialise to a flat file, not a hive partition tree."""
+    from datorcloud.snapshots import snapshot_cohort  # only this test needs it
+
+    # Seed L1 and L2 rows so the snapshot has something to freeze.
+    catalog.write_rows("l1_experiment", _sample_l1())
+    catalog.write_rows("l2_sensor", _sample_l2())
+    snapshot_cohort(catalog, dataset_id="totalsegmentator", snapshot_date="2026-05-27")
+
+    files = catalog.materialize_parquet(layers=["l4_cohort_snapshot"])["l4_cohort_snapshot"]
+    assert files
+    flat_file = Path(files[0])
+    assert "dataset_id=" not in flat_file.as_posix() and flat_file.name == "part.parquet"
diff --git a/tests/test_schema_migration.py b/tests/test_schema_migration.py
new file mode 100644
index 0000000..89ee0df
--- /dev/null
+++ b/tests/test_schema_migration.py
@@ -0,0 +1,148 @@
+"""Phase 1 step 1.1 gate: DDL migration is idempotent.
+
+Per STEP_BY_STEP_PLAN.md §3 step 1.1, ``schemas/l1_l4.sql`` must:
+
+  (a) apply cleanly to a fresh DuckDB connection,
+  (b) re-apply without error (idempotent),
+  (c) expose a stable ``schema_sha`` across two runs on an unchanged
+      checkout (this is the same property that integration-test
+      ``doris-it-01-catalog`` assertion (a) checks system-wide).
+"""
+
+from __future__ import annotations
+
+import duckdb
+import pytest
+
+from datorcloud.schemas import Migration, SCHEMA_VERSION
+
+
+def test_schema_version_string_present() -> None:
+    assert SCHEMA_VERSION.count(".") == 2  # exactly two dots, as in MAJOR.MINOR.PATCH
+
+
+def test_apply_creates_every_layer() -> None:
+    """Applying the DDL to a fresh connection creates every L1-L4 base table."""
+    expected = {
+        "l1_experiment",
+        "l1_citations",
+        "l1_processing",
+        "l2_sensor",
+        "l3_annotation",
+        "l4_cohort_snapshot",
+        "l4_eval_set",
+    }
+    # Context manager releases the connection even when apply/execute raises.
+    with duckdb.connect(":memory:") as conn:
+        Migration.from_path().apply(conn)
+        rows = conn.execute(
+            "SELECT table_name FROM information_schema.tables "
+            "WHERE table_schema = 'main' AND table_type = 'BASE TABLE'"
+        ).fetchall()
+    tables = {name for (name,) in rows}
+    assert expected.issubset(tables), f"missing tables: {expected - tables}"
+
+
+def test_apply_creates_every_enum() -> None:
+    """Every ENUM type the catalog relies on is registered after ``apply``."""
+    with duckdb.connect(":memory:") as conn:  # closed on exit, even on failure
+        Migration.from_path().apply(conn)
+        rows = conn.execute("SELECT type_name FROM duckdb_types()").fetchall()
+    type_names = {name for (name,) in rows}
+    for enum in ("privacy_class", "annotation_kind", "instance_label", "processing_stage"):
+        assert enum in type_names, f"ENUM {enum!r} not registered"
+
+
+def test_apply_is_idempotent_no_errors() -> None:
+    """Re-applying the migration raises nothing and reports the same identity."""
+    m = Migration.from_path()
+    with duckdb.connect(":memory:") as conn:  # closed on exit, even on failure
+        r1 = m.apply(conn)
+        # The second pass may skip entities that already exist; no error may escape.
+        r2 = m.apply(conn)
+    assert r1.schema_sha == r2.schema_sha
+    assert r1.schema_version == r2.schema_version
+
+
+def test_schema_sha_stable_across_reruns(tmp_path) -> None:
+    """Loading the DDL twice from one checkout yields the same ``schema_sha``.
+
+    No connection is opened, so the digest cannot depend on connection
+    state. ``tmp_path`` is requested but not used by the body.
+    """
+    first, second = (Migration.from_path().schema_sha for _ in range(2))
+    assert first == second
+    assert len(first) == 64  # hex sha-256
+
+
+def test_schema_sha_insensitive_to_comments() -> None:
+    """Comment text and surrounding whitespace must leave ``schema_sha`` unchanged.
+
+    Whitespace between tokens inside a statement (``(x INTEGER)`` versus
+    ``( x INTEGER )``) is deliberately NOT normalised, so it does change
+    the hash.
+    """
+    commented = """
+    -- one comment
+    CREATE TABLE IF NOT EXISTS demo (x INTEGER);
+    """
+    bare = "\n   CREATE TABLE IF NOT EXISTS demo (x INTEGER);\n"
+    recommented = """
+    -- a completely different comment
+    CREATE TABLE IF NOT EXISTS demo (x INTEGER);
+    """
+    variants = (commented, bare, recommented)
+    digests = {Migration.from_text(ddl).schema_sha for ddl in variants}
+    # A single distinct digest means all three spellings hash identically,
+    # i.e. neither the comment text nor the outer whitespace leaked in.
+    assert len(digests) == 1
+
+
+def test_l1_unique_key_includes_study_id() -> None:
+    """STEP_BY_STEP_PLAN.md §3 step 1.1: DICOM rows with multiple
+    ``study_id`` values for the same ``subject_id`` must not collide.
+    """
+    # Both rows share dataset, version and subject; only uid and study_id differ.
+    insert_sql = """
+        INSERT INTO l1_experiment
+            (record_uid, dataset_id, dataset_version, subject_id, study_id,
+             privacy_class, license_spdx, redistribution_ok)
+        VALUES
+            ('u1', 'tcia', 'idc_v18', 'sub-001', 'study-A',
+             'public', 'CC-BY-4.0', TRUE),
+            ('u2', 'tcia', 'idc_v18', 'sub-001', 'study-B',
+             'public', 'CC-BY-4.0', TRUE)
+        """
+    with duckdb.connect(":memory:") as conn:  # closed on exit, even on failure
+        Migration.from_path().apply(conn)
+        conn.execute(insert_sql)
+        n = conn.execute("SELECT count(*) FROM l1_experiment").fetchone()[0]
+    assert n == 2
+
+
+def test_l2_unique_key_splits_compound_modalities() -> None:
+    """L2 must accept the same record under multiple (modality, sequence)
+    pairs so CVPR ``"MR (T2, ADC)"`` strings split losslessly.
+    """
+    # One L1 row is inserted first, then the L2 rows that reference its uid.
+    parent_sql = """
+        INSERT INTO l1_experiment
+            (record_uid, dataset_id, dataset_version, subject_id, study_id,
+             privacy_class, license_spdx, redistribution_ok)
+        VALUES ('u1', 'mri_ts', 'v2', 'sub-001', '',
+                'public', 'CC-BY-4.0', TRUE)
+        """
+    # Same record and modality twice; only the sequence distinguishes the rows.
+    sensors_sql = """
+        INSERT INTO l2_sensor
+            (record_uid, modality, sequence, raw_format)
+        VALUES
+            ('u1', 'MR', 'T2', 'nii.gz'),
+            ('u1', 'MR', 'ADC', 'nii.gz')
+        """
+    with duckdb.connect(":memory:") as conn:  # closed on exit, even on failure
+        Migration.from_path().apply(conn)
+        conn.execute(parent_sql)
+        conn.execute(sensors_sql)
+        n = conn.execute("SELECT count(*) FROM l2_sensor").fetchone()[0]
+    assert n == 2
diff --git a/tests/test_snapshots.py b/tests/test_snapshots.py
new file mode 100644
index 0000000..5ad2033
--- /dev/null
+++ b/tests/test_snapshots.py
@@ -0,0 +1,252 @@
+"""Phase 1 step 1.4 gate: L4 snapshot freeze.
+
+Asserts:
+  * ``snapshot_cohort`` writes one row to ``l4_cohort_snapshot``,
+  * ``catalog_sha256`` is byte-identical across two consecutive
+    snapshots of the same cohort **even after**
+    ``l2_sensor.converted_uri`` mutates between the two snapshots,
+  * ``load_snapshot_payload`` reconstructs the frozen rows.
+
+This is the property that integration-test ``doris-it-01-catalog``
+assertion (c) exercises at the system level.
+"""
+
+from __future__ import annotations
+
+import pandas as pd
+import pytest
+
+from datorcloud.components.parquet_catalog_component import ParquetCatalogComponent
+from datorcloud.snapshots import (
+    create_eval_set,
+    load_snapshot_payload,
+    snapshot_cohort,
+)
+
+
+@pytest.fixture  # default (function) scope: each test builds its own catalog
+def catalog(tmp_path) -> ParquetCatalogComponent:
+    return ParquetCatalogComponent(metadata_base_uri=str(tmp_path / "catalog"))
+
+
+def _seed_two_subjects(catalog: ParquetCatalogComponent) -> None:  # writes L1, L2 and L3 rows for u1 and u2
+    l1 = pd.DataFrame(  # two public CC-BY-4.0 records in totalsegmentator v2
+        [
+            {
+                "record_uid": "u1",
+                "dataset_id": "totalsegmentator",
+                "dataset_version": "v2",
+                "subject_id": "s0011",
+                "study_id": "",
+                "privacy_class": "public",
+                "license_spdx": "CC-BY-4.0",
+                "redistribution_ok": True,
+                "license_rule_version": "v1",
+                "share_alike_obligation": False,
+            },
+            {
+                "record_uid": "u2",
+                "dataset_id": "totalsegmentator",
+                "dataset_version": "v2",
+                "subject_id": "s0012",
+                "study_id": "",
+                "privacy_class": "public",
+                "license_spdx": "CC-BY-4.0",
+                "redistribution_ok": True,
+                "license_rule_version": "v1",
+                "share_alike_obligation": False,
+            },
+        ]
+    )
+    l2 = pd.DataFrame(  # one CT row per record; only raw_uri is set, no converted_uri
+        [
+            {
+                "record_uid": "u1",
+                "modality": "CT",
+                "sequence": "",
+                "raw_format": "nii.gz",
+                "raw_uri": "s3://orx-datalake/totalsegmentator/u1/ct.nii.gz",
+            },
+            {
+                "record_uid": "u2",
+                "modality": "CT",
+                "sequence": "",
+                "raw_format": "nii.gz",
+                "raw_uri": "s3://orx-datalake/totalsegmentator/u2/ct.nii.gz",
+            },
+        ]
+    )
+    l3 = pd.DataFrame(  # one "auto" femur_left annotation per record
+        [
+            {
+                "record_uid": "u1",
+                "label_canonical": "femur_left",
+                "annotator": "ts_v2",
+                "annotation_kind": "auto",
+                "instance_label": "semantic",
+                "mask_uri": "s3://orx-datalake/totalsegmentator/u1/seg/femur_left.nii.gz",
+            },
+            {
+                "record_uid": "u2",
+                "label_canonical": "femur_left",
+                "annotator": "ts_v2",
+                "annotation_kind": "auto",
+                "instance_label": "semantic",
+                "mask_uri": "s3://orx-datalake/totalsegmentator/u2/seg/femur_left.nii.gz",
+            },
+        ]
+    )
+    catalog.write_rows("l1_experiment", l1)  # L1 is written before the layers that reference its uids
+    catalog.write_rows("l2_sensor", l2)
+    catalog.write_rows("l3_annotation", l3)
+
+
+# ---------------------------------------------------------------------------
+# Freeze semantics
+# ---------------------------------------------------------------------------
+
+
+def test_snapshot_writes_row(catalog: ParquetCatalogComponent) -> None:
+    """Freezing a cohort records exactly one matching ``l4_cohort_snapshot`` row."""
+    _seed_two_subjects(catalog)
+    snap = snapshot_cohort(
+        catalog, dataset_id="totalsegmentator", snapshot_date="2026-05-27"
+    )
+    assert snap.snapshot_id == "totalsegmentator@2026-05-27"
+    assert snap.n_records == 2
+    assert len(snap.catalog_sha256) == 64
+
+    # The persisted row must agree with the returned snapshot object.
+    stored = catalog.query(
+        "SELECT * FROM l4_cohort_snapshot WHERE snapshot_id = ?",
+        params=[snap.snapshot_id],
+    )
+    assert len(stored) == 1
+    persisted = stored.iloc[0]
+    assert (persisted["n_records"], persisted["catalog_sha256"]) == (2, snap.catalog_sha256)
+
+
+def test_snapshot_sha_stable_across_reruns(catalog: ParquetCatalogComponent) -> None:
+    """Two freezes of an unchanged cohort agree on hash and record count."""
+    _seed_two_subjects(catalog)
+    # Both calls pass the same dataset_id and snapshot_date.
+    first, second = (
+        snapshot_cohort(catalog, dataset_id="totalsegmentator", snapshot_date="2026-05-27")
+        for _ in range(2)
+    )
+    assert first.catalog_sha256 == second.catalog_sha256
+    assert first.n_records == second.n_records
+
+
+def test_snapshot_sha_stable_after_converted_uri_writes(
+    catalog: ParquetCatalogComponent,
+) -> None:
+    """Phase 1 §3 step 1.4 + integration-test assertion (c).
+
+    Re-freezing the same cohort after ``l2_sensor.converted_uri`` has been
+    filled in must reproduce the ``catalog_sha256`` of the freeze taken
+    before those writes.
+    """
+    _seed_two_subjects(catalog)
+    # Both freezes are requested with exactly these keyword arguments.
+    cohort = {"dataset_id": "totalsegmentator", "snapshot_date": "2026-05-27"}
+    before = snapshot_cohort(catalog, **cohort)
+
+    # Simulate the conversion stage filling in converted_uri for both
+    # subjects after the first snapshot was frozen.
+    for uid in ("u1", "u2"):
+        zarr_uri = f"s3://orx-datalake/totalsegmentator/{uid}/ct.zarr"
+        catalog.update_l2_converted_uri(
+            record_uid=uid,
+            modality="CT",
+            sequence="",
+            converted_uri=zarr_uri,
+        )
+
+    after = snapshot_cohort(catalog, **cohort)
+    # Only the converted_uri writes above separate the two freezes.
+    assert before.catalog_sha256 == after.catalog_sha256, (
+        "snapshot hash must be insensitive to asynchronous converted_uri "
+        "writes (Phase 1 §3 step 1.4)"
+    )
+
+
+def test_snapshot_predicate_filters_rows(catalog: ParquetCatalogComponent) -> None:
+    """A ``predicate_sql`` filter limits which records the snapshot freezes."""
+    _seed_two_subjects(catalog)
+    snap = snapshot_cohort(
+        catalog,
+        dataset_id="totalsegmentator",
+        predicate_sql="subject_id = 's0011'",
+        snapshot_date="2026-05-27",
+    )
+    assert snap.n_records == 1
+    payload = load_snapshot_payload(catalog, snap.snapshot_id)
+    assert payload.loc[payload["layer"] == "l1_experiment", "subject_id"].tolist() == ["s0011"]
+
+
+def test_load_snapshot_payload_round_trip(catalog: ParquetCatalogComponent) -> None:
+    """The stored payload carries every L1-L3 layer and both seeded records."""
+    _seed_two_subjects(catalog)
+    snap = snapshot_cohort(catalog, dataset_id="totalsegmentator", snapshot_date="2026-05-27")
+    payload = load_snapshot_payload(catalog, snap.snapshot_id)
+    assert set(payload["layer"]).issuperset({"l1_experiment", "l2_sensor", "l3_annotation"})
+    l1_uids = payload.loc[payload["layer"] == "l1_experiment", "record_uid"]
+    assert set(l1_uids) == {"u1", "u2"}
+
+
+def test_load_snapshot_payload_missing(catalog: ParquetCatalogComponent) -> None:
+    with pytest.raises(KeyError):  # this test freezes no snapshot before the lookup
+        load_snapshot_payload(catalog, "nonexistent@2026-05-27")
+
+
+# ---------------------------------------------------------------------------
+# Eval-set creation (Phase 1 step 1.5)
+# ---------------------------------------------------------------------------
+
+
+def test_create_eval_set_attaches(catalog: ParquetCatalogComponent) -> None:
+    """Creating an eval set on a frozen snapshot stores one ``l4_eval_set`` row."""
+    _seed_two_subjects(catalog)
+    snap = snapshot_cohort(catalog, dataset_id="totalsegmentator", snapshot_date="2026-05-27")
+    es = create_eval_set(
+        catalog,
+        eval_set_id="shoulder_ct_v3",
+        snapshot_id=snap.snapshot_id,
+        annotator_columns=["annotator_a", "annotator_b"],
+        target_labels=["femur_left", "femur_right"],
+        inter_observer_quantiles=[0.25, 0.75],
+    )
+    assert es.eval_set_id == "shoulder_ct_v3"
+    # The catalog is fresh per test, so this is the only eval-set row.
+    stored = catalog.query("SELECT * FROM l4_eval_set")
+    assert len(stored) == 1
+
+
+def test_create_eval_set_unknown_snapshot_raises(catalog: ParquetCatalogComponent) -> None:
+    dangling_request = {  # this test freezes no snapshot before asking for one
+        "eval_set_id": "x",
+        "snapshot_id": "nonexistent@2026-05-27",
+        "annotator_columns": ["a"],
+        "target_labels": ["femur_left"],
+    }
+    with pytest.raises(KeyError):
+        create_eval_set(catalog, **dangling_request)
+
+
+def test_create_eval_set_validates_quantile_arity(
+    catalog: ParquetCatalogComponent,
+) -> None:
+    """A quantile list holding one value instead of two raises ValueError."""
+    _seed_two_subjects(catalog)
+    snap = snapshot_cohort(catalog, dataset_id="totalsegmentator", snapshot_date="2026-05-27")
+    lone_quantile = [0.5]  # only one value, not two
+    with pytest.raises(ValueError):
+        create_eval_set(
+            catalog,
+            eval_set_id="bad",
+            snapshot_id=snap.snapshot_id,
+            annotator_columns=["a"],
+            target_labels=["femur_left"],
+            inter_observer_quantiles=lone_quantile,
+        )