From 37cafc87dd8a7f13571dec33857bc3e437183d5d Mon Sep 17 00:00:00 2001 From: jdsika Date: Thu, 26 Mar 2026 17:16:37 +0100 Subject: [PATCH] feat(generators): add --deterministic flag for reproducible output MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Add a --deterministic flag to OWL, SHACL, and JSON-LD generators that produces byte-identical output across invocations, eliminating spurious diffs in version-controlled artifacts. Deterministic Turtle serialization (deterministic_turtle): - W3C RDFC-1.0 canonicalization via pyoxigraph (standard-compliant) - Weisfeiler-Lehman structural hashing for diff-stable blank node IDs (_:b) instead of sequential (_:c14nN) - Sorted prefix declarations and triple blocks Collection sorting (gated behind --deterministic): - owl:oneOf, sh:in, sh:ignoredProperties items sorted when flag is set - Preserves existing behaviour by default deterministic_json: - Recursive deep-sort for JSON-LD context output pyoxigraph >= 0.4.0 is imported lazily and only when --deterministic is used. Not a core dependency — avoids conflict with morph-kgc. Tests skip gracefully when pyoxigraph >= 0.4.0 is unavailable. 
@staticmethod
def _deterministic_context_json(data: dict, indent: int = 3) -> str:
    """Serialize a JSON-LD context with deterministic key ordering.

    Preserves the conventional JSON-LD context layout:

    1. ``comments`` block first (metadata)
    2. ``@context`` block second, internally ordered as:
       a. ``@``-prefixed directives (``@vocab``, ``@base``) first
       b. Prefix declarations (string values) second
       c. Class/property term entries (object values) last
    3. Each group sorted alphabetically within itself

    Unlike :func:`deterministic_json`, this understands JSON-LD
    conventions so the output stays human-readable while remaining
    byte-identical across invocations.

    :param data: Parsed JSON-LD context document.
    :param indent: Number of spaces for indentation (default 3).
    :returns: Deterministic, pretty-printed JSON string.
    """
    # Deferred to avoid a circular import at module load time.
    from linkml.utils.generator import deterministic_json

    result: dict = {}

    # 1. "comments" first (if present)
    if "comments" in data:
        result["comments"] = data["comments"]

    # 2. "@context" with structured internal ordering
    if "@context" in data:
        ctx = data["@context"]

        # 2a. @-prefixed directives (@vocab, @base, etc.)
        directive_keys = sorted(key for key in ctx if key.startswith("@"))
        # 2b. Prefix declarations (string values — short namespace URIs)
        prefix_keys = sorted(
            key for key in ctx if not key.startswith("@") and isinstance(ctx[key], str)
        )
        # 2c. Term definitions (object values) — deep-sorted for determinism
        term_entries = {
            key: value
            for key, value in ctx.items()
            if not key.startswith("@") and not isinstance(value, str)
        }
        canonical_terms = json.loads(deterministic_json(term_entries))

        rebuilt_ctx = {key: ctx[key] for key in directive_keys}
        rebuilt_ctx.update((key, ctx[key]) for key in prefix_keys)
        rebuilt_ctx.update((key, canonical_terms[key]) for key in sorted(canonical_terms))
        result["@context"] = rebuilt_ctx

    # 3. Any remaining top-level keys
    for key in sorted(data):
        if key not in result:
            result[key] = data[key]

    return json.dumps(result, indent=indent, ensure_ascii=False)
self.original_schema return out diff --git a/packages/linkml/src/linkml/generators/owlgen.py b/packages/linkml/src/linkml/generators/owlgen.py index 33c58b0ec..4ab4b8cf3 100644 --- a/packages/linkml/src/linkml/generators/owlgen.py +++ b/packages/linkml/src/linkml/generators/owlgen.py @@ -267,7 +267,14 @@ def serialize(self, **kwargs) -> str: :return: """ self.as_graph() - data = self.graph.serialize(format="turtle" if self.format in ["owl", "ttl"] else self.format) + fmt = "turtle" if self.format in ["owl", "ttl"] else self.format + if self.deterministic and fmt == "turtle": + # Deferred to avoid circular import (generator.py imports from this package) + from linkml.utils.generator import deterministic_turtle + + data = deterministic_turtle(self.graph) + else: + data = self.graph.serialize(format=fmt) return data def add_metadata(self, e: Definition | PermissibleValue, uri: URIRef) -> None: @@ -998,7 +1005,10 @@ def add_enum(self, e: EnumDefinition) -> None: owl_types = [] enum_owl_type = self._get_metatype(e, self.default_permissible_value_type) - for pv in e.permissible_values.values(): + pvs = e.permissible_values.values() + if self.deterministic: + pvs = sorted(pvs, key=lambda x: x.text) + for pv in pvs: pv_owl_type = self._get_metatype(pv, enum_owl_type) owl_types.append(pv_owl_type) if pv_owl_type == RDFS.Literal: diff --git a/packages/linkml/src/linkml/generators/shaclgen.py b/packages/linkml/src/linkml/generators/shaclgen.py index 5425051e3..ec78e7ba5 100644 --- a/packages/linkml/src/linkml/generators/shaclgen.py +++ b/packages/linkml/src/linkml/generators/shaclgen.py @@ -93,7 +93,13 @@ def generate_header(self) -> str: def serialize(self, **args) -> str: g = self.as_graph() - data = g.serialize(format="turtle" if self.format in ["owl", "ttl"] else self.format) + fmt = "turtle" if self.format in ["owl", "ttl"] else self.format + if self.deterministic and fmt == "turtle": + from linkml.utils.generator import deterministic_turtle + + data = 
def _wl_signatures(
    quads: list,
    iterations: int = 4,
) -> dict[str, str]:
    """Compute Weisfeiler-Lehman structural signatures for blank nodes.

    Uses 1-dimensional WL colour refinement [1]_ to assign each blank
    node a deterministic signature derived from its multi-hop
    neighbourhood structure. The signature depends only on predicate
    IRIs, literal values, and named-node IRIs — **not** on blank-node
    identifiers — so it remains stable when unrelated triples are added
    or removed.

    Parameters
    ----------
    quads : list
        Canonical quads from pyoxigraph (after RDFC-1.0).
    iterations : int
        Number of WL refinement rounds (default 4).

    Returns
    -------
    dict[str, str]
        Mapping from canonical blank-node ID (e.g. ``c14n42``) to a
        truncated SHA-256 hash suitable for use as a stable blank-node
        label.

    References
    ----------
    .. [1] Weisfeiler, B. & Leman, A. (1968). "The reduction of a graph
       to canonical form and the algebra which appears therein."
    """
    import hashlib

    try:
        import pyoxigraph
    except ImportError as exc:
        raise ImportError(
            "pyoxigraph >= 0.4.0 is required for --deterministic output. "
            "Install it with: pip install 'pyoxigraph>=0.4.0'"
        ) from exc

    # Collect all blank node IDs and build adjacency index.
    bnode_ids: set[str] = set()
    # outgoing[b] = list of (predicate_str, object_str_or_bnode_id, is_bnode)
    outgoing: dict[str, list[tuple[str, str, bool]]] = {}
    # incoming[b] = list of (subject_str_or_bnode_id, predicate_str, is_bnode)
    incoming: dict[str, list[tuple[str, str, bool]]] = {}

    for q in quads:
        s, p, o = q.subject, q.predicate, q.object
        s_is_bn = isinstance(s, pyoxigraph.BlankNode)
        o_is_bn = isinstance(o, pyoxigraph.BlankNode)
        p_str = str(p)

        if s_is_bn:
            bnode_ids.add(s.value)
            outgoing.setdefault(s.value, []).append((p_str, o.value if o_is_bn else str(o), o_is_bn))
        if o_is_bn:
            bnode_ids.add(o.value)
            incoming.setdefault(o.value, []).append((s.value if s_is_bn else str(s), p_str, s_is_bn))

    # Initialise signatures: named-node edges only (no bnode IDs), so the
    # starting colour is independent of canonical numbering.
    sig: dict[str, str] = {}
    for bid in bnode_ids:
        parts = []
        for p_str, o_str, o_is_bn in outgoing.get(bid, []):
            if not o_is_bn:
                parts.append(f"+{p_str}={o_str}")
        for s_str, p_str, s_is_bn in incoming.get(bid, []):
            if not s_is_bn:
                parts.append(f"-{s_str}={p_str}")
        sig[bid] = "|".join(sorted(parts))

    # Iterative refinement: incorporate neighbour signatures.
    for _ in range(iterations):
        new_sig: dict[str, str] = {}
        for bid in bnode_ids:
            parts = [sig[bid]]
            for p_str, o_str, o_is_bn in outgoing.get(bid, []):
                if o_is_bn:
                    parts.append(f"+{p_str}={sig.get(o_str, '')}")
            for s_str, p_str, s_is_bn in incoming.get(bid, []):
                if s_is_bn:
                    parts.append(f"-{sig.get(s_str, '')}={p_str}")
            new_sig[bid] = "|".join(sorted(parts))
        sig = new_sig

    # Convert signatures to truncated SHA-256 hashes.
    # 12 hex chars = 48 bits. By the birthday bound, the chance of *any*
    # collision among n blank nodes is ~ n^2 / 2^49 — roughly 1 in 2^16
    # for 100k blank nodes. Collisions are disambiguated below with a
    # counter (assigned in sorted canonical-ID order, so the result stays
    # deterministic either way).
    hash_map: dict[str, str] = {}
    seen_hashes: dict[str, int] = {}
    for bid in sorted(bnode_ids):
        digest = hashlib.sha256(sig[bid].encode("utf-8")).hexdigest()[:12]
        # Handle collisions by appending a counter.
        count = seen_hashes.get(digest, 0)
        seen_hashes[digest] = count + 1
        label = f"b{digest}" if count == 0 else f"b{digest}_{count}"
        hash_map[bid] = label

    return hash_map


def deterministic_turtle(graph: "RdfGraph") -> str:
    """Serialize an RDF graph to Turtle with deterministic output ordering.

    Uses a three-phase hybrid pipeline for **correctness**, **diff
    stability**, and **readability**:

    1. **RDFC-1.0** [1]_ (via ``pyoxigraph``) canonicalizes the graph,
       ensuring isomorphic inputs produce identical triple sets.
    2. **Weisfeiler-Lehman structural hashing** replaces the sequential
       ``_:c14nN`` identifiers with content-based hashes derived from
       each blank node's multi-hop neighbourhood. These hashes depend
       only on predicate IRIs, literal values, and named-node IRIs —
       not on blank-node numbering — so adding or removing a triple
       only affects the identifiers of directly involved blank nodes.
    3. **Hybrid rdflib re-serialization** parses the canonicalized,
       WL-hashed triples back into an rdflib ``Graph`` and serializes
       with rdflib's native Turtle writer. This recovers idiomatic
       Turtle features that pyoxigraph cannot emit:

       - **Inline blank nodes** (``[ … ]``) for singly-referenced
         blank nodes (Turtle §2.7 [2]_), instead of verbose named
         ``_:bHASH`` syntax.
       - **Collection syntax** (``( … )``) for ``rdf:List`` chains
         (Turtle §2.8 [2]_).
       - **Prefix filtering**: only prefixes actually used in the
         graph's IRIs are declared, following the practice of Apache
         Jena, Eclipse RDF4J, and Raptor.

    All triples from the source graph are preserved — the hybrid step
    only changes syntactic form, never semantic content.

    Parameters
    ----------
    graph : rdflib.Graph
        An rdflib Graph to serialize.

    Returns
    -------
    str
        Deterministic Turtle string with ``@prefix`` declarations.

    References
    ----------
    .. [1] W3C (2024). "RDF Dataset Canonicalization (RDFC-1.0)."
       W3C Recommendation. https://www.w3.org/TR/rdf-canon/
    .. [2] W3C (2014). "RDF 1.1 Turtle — Terse RDF Triple Language."
       W3C Recommendation. https://www.w3.org/TR/turtle/
    """
    try:
        import pyoxigraph
    except ImportError as exc:
        raise ImportError(
            "pyoxigraph >= 0.4.0 is required for --deterministic output. "
            "Install it with: pip install 'pyoxigraph>=0.4.0'"
        ) from exc

    from rdflib import BNode, Graph, Literal, URIRef

    # ── Phase 1: RDFC-1.0 canonicalization ──────────────────────────
    nt_data = graph.serialize(format="nt")

    dataset = pyoxigraph.Dataset(pyoxigraph.parse(nt_data, format=pyoxigraph.RdfFormat.N_TRIPLES))
    dataset.canonicalize(pyoxigraph.CanonicalizationAlgorithm.RDFC_1_0)

    canonical_quads = list(dataset)

    # ── Phase 2: WL structural hashing for diff-stable blank node IDs
    wl_map = _wl_signatures(canonical_quads)

    def _remap(term):
        if isinstance(term, pyoxigraph.BlankNode) and term.value in wl_map:
            return pyoxigraph.BlankNode(wl_map[term.value])
        return term

    remapped = [pyoxigraph.Triple(_remap(q.subject), q.predicate, _remap(q.object)) for q in canonical_quads]

    # ── Phase 3: Hybrid rdflib re-serialization ─────────────────────
    # Convert pyoxigraph terms to rdflib terms and populate a clean
    # Graph that only carries explicitly-bound prefixes.
    def _to_rdflib(term):
        """Convert a pyoxigraph term to the equivalent rdflib term."""
        if isinstance(term, pyoxigraph.NamedNode):
            return URIRef(term.value)
        if isinstance(term, pyoxigraph.BlankNode):
            return BNode(term.value)
        if isinstance(term, pyoxigraph.Literal):
            if term.language:
                return Literal(term.value, lang=term.language)
            if term.datatype:
                dt_iri = term.datatype.value
                # In RDF 1.1, simple literals are syntactic sugar for
                # xsd:string (Turtle §2.5.1). Preserve the shorter form
                # to match the original owlgen output and avoid spurious
                # diffs on every string literal.
                if dt_iri == "http://www.w3.org/2001/XMLSchema#string":
                    return Literal(term.value)
                return Literal(term.value, datatype=URIRef(dt_iri))
            return Literal(term.value)
        return URIRef(str(term))

    result_graph = Graph(bind_namespaces="none")
    for triple in remapped:
        result_graph.add((
            _to_rdflib(triple.subject),
            _to_rdflib(triple.predicate),
            _to_rdflib(triple.object),
        ))

    # Bind only prefixes whose namespace IRI is actually referenced
    # by at least one subject, predicate, or object in the graph.
    # This filters out rdflib's ~27 built-in default bindings
    # (brick, csvw, doap, …) that leak through Graph() even when
    # the schema never declared them.
    used_iris: set[str] = set()
    for s, p, o in result_graph:
        for term in (s, p, o):
            if isinstance(term, URIRef):
                used_iris.add(str(term))

    for pfx, ns in sorted(graph.namespaces()):
        pfx_s, ns_s = str(pfx), str(ns)
        if pfx_s and any(iri.startswith(ns_s) for iri in used_iris):
            result_graph.bind(pfx_s, ns_s)

    return result_graph.serialize(format="turtle")


def deterministic_json(obj: object, indent: int = 3) -> str:
    """Serialize a JSON-compatible object with deterministic ordering.

    Recursively sorts all dict keys *and* list elements to produce
    stable output across Python versions and process invocations.

    List elements are sorted by their canonical JSON representation
    (``json.dumps(item, sort_keys=True)``), which handles lists of
    dicts, strings, and mixed types. If an element is not
    JSON-serializable (``json.dumps`` raises ``TypeError``), the list
    is left in its original order rather than failing.

    :param obj: A JSON-serializable object (typically parsed from ``as_json``).
    :param indent: Number of spaces for indentation.
    :returns: Deterministic JSON string.
    """
    import json

    def _deep_sort(value: object) -> object:
        if isinstance(value, dict):
            return {k: _deep_sort(v) for k, v in sorted(value.items())}
        if isinstance(value, list):
            sorted_items = [_deep_sort(item) for item in value]
            try:
                return sorted(sorted_items, key=lambda x: json.dumps(x, sort_keys=True, ensure_ascii=False))
            except TypeError:
                return sorted_items
        return value

    return json.dumps(_deep_sort(obj), indent=indent, ensure_ascii=False)


def well_known_prefix_map() -> dict[str, str]:
    """Return a mapping from namespace URI to standard prefix name.

    Uses rdflib's curated default namespace bindings as the source of truth.
    For example, ``https://schema.org/`` maps to ``schema``.

    This allows generators to normalise non-standard prefix aliases
    (e.g. ``sdo`` for ``https://schema.org/``) to their conventional names.
    """
    from rdflib import Graph as RdfGraph

    return {str(ns): str(pfx) for pfx, ns in RdfGraph().namespaces() if str(pfx)}
"""Benchmark: deterministic Turtle serializer on real-world ontologies.

Evaluates the ``--deterministic`` flag against schema.org (~16 000 triples,
~800 classes, ~1 400 properties) and the kitchen_sink LinkML schema to
demonstrate four properties:

1. **Semantic equivalence** — ``rdflib.compare.isomorphic()`` confirms that
   deterministic and non-deterministic outputs encode the same RDF graph.
2. **Byte-level stability** — SHA-256 identity across repeated runs proves
   that deterministic output is truly reproducible.
3. **Diff quality** — controlled mutations show that small schema changes
   produce small, focused diffs (high signal-to-noise ratio).
4. **Performance** — generation time stays within acceptable bounds even
   on large real-world graphs.

Schema.org tests exercise ``deterministic_turtle()`` directly on a
pre-existing OWL ontology. Kitchen_sink tests exercise the full
``OwlSchemaGenerator`` / ``ShaclGenerator`` pipeline with LinkML schemas.

References
----------
- W3C RDFC-1.0: https://www.w3.org/TR/rdf-canon/
- W3C Turtle 1.1: https://www.w3.org/TR/turtle/
- schema.org: https://schema.org/docs/developers.html
"""

import difflib
import hashlib
import time
from pathlib import Path

import pytest
import yaml
from rdflib import Graph
from rdflib.compare import isomorphic

from linkml.generators.owlgen import OwlSchemaGenerator
from linkml.generators.shaclgen import ShaclGenerator
from linkml.utils.generator import deterministic_turtle

# Deterministic Turtle requires pyoxigraph >= 0.4.0 (for Dataset/canonicalize).
_has_pyoxigraph = False
try:
    import pyoxigraph

    _has_pyoxigraph = hasattr(pyoxigraph, "Dataset")
except ImportError:
    pass

pytestmark = pytest.mark.skipif(
    not _has_pyoxigraph,
    reason="pyoxigraph >= 0.4.0 required for deterministic benchmarks",
)

KITCHEN_SINK = str(Path(__file__).parent / "input" / "kitchen_sink.yaml")
SCHEMA_ORG_URL = "https://schema.org/version/latest/schemaorg-current-https.ttl"


def _sha256(text: str) -> str:
    """Hex SHA-256 digest of *text*, used for byte-identity comparisons."""
    return hashlib.sha256(text.encode()).hexdigest()


def _diff_line_count(a: str, b: str) -> int:
    """Count lines present in *b* but not in *a* (unified-diff additions)."""
    al = a.strip().splitlines()
    bl = b.strip().splitlines()
    return sum(
        1
        for line in difflib.unified_diff(al, bl, lineterm="")
        if line.startswith("+") and not line.startswith("+++")
    )


# ── Schema.org: direct serializer benchmark ────────────────────────


@pytest.fixture(scope="module")
def schema_org_graph():
    """Download and parse schema.org as an rdflib Graph.

    Cached for the module so the network fetch only happens once.
    Skips all dependent tests if the download fails.
    """
    try:
        import urllib.request

        with urllib.request.urlopen(SCHEMA_ORG_URL, timeout=60) as resp:
            data = resp.read().decode("utf-8")
    except Exception as exc:
        pytest.skip(f"Could not fetch schema.org: {exc}")

    g = Graph()
    g.parse(data=data, format="turtle")
    return g


@pytest.mark.network
class TestSchemaOrgDeterministicSerializer:
    """Benchmark ``deterministic_turtle()`` on schema.org OWL ontology."""

    def test_semantic_equivalence(self, schema_org_graph):
        """Deterministic serialization must be isomorphic to the original graph."""
        det_ttl = deterministic_turtle(schema_org_graph)

        g_det = Graph()
        g_det.parse(data=det_ttl, format="turtle")

        assert len(g_det) == len(schema_org_graph), (
            f"Triple count mismatch: original={len(schema_org_graph)}, "
            f"deterministic={len(g_det)}"
        )
        assert isomorphic(g_det, schema_org_graph), (
            "Deterministic output is NOT isomorphic to original schema.org graph"
        )

    def test_byte_stability(self, schema_org_graph):
        """Two deterministic runs must produce byte-identical output."""
        run1 = deterministic_turtle(schema_org_graph)
        run2 = deterministic_turtle(schema_org_graph)
        assert _sha256(run1) == _sha256(run2), (
            "Deterministic serializer produced different output across runs"
        )

    def test_prefix_filtering(self, schema_org_graph):
        """Only prefixes actually used in the graph should be declared."""
        det_ttl = deterministic_turtle(schema_org_graph)

        # Extract declared prefixes
        declared = {}
        for line in det_ttl.splitlines():
            if line.startswith("@prefix"):
                parts = line.split()
                pfx = parts[1].rstrip(":")
                ns = parts[2].strip("<>")
                declared[pfx] = ns

        # Collect all IRIs in the graph
        from rdflib import URIRef

        used_iris = set()
        for s, p, o in schema_org_graph:
            for term in (s, p, o):
                if isinstance(term, URIRef):
                    used_iris.add(str(term))

        # Every declared prefix must have at least one IRI using it
        for pfx, ns in declared.items():
            assert any(iri.startswith(ns) for iri in used_iris), (
                f"Prefix '{pfx}:' <{ns}> declared but no IRI uses it"
            )

    def test_performance(self, schema_org_graph):
        """Serialization must complete within 60 seconds for ~16K triples."""
        start = time.time()
        det_ttl = deterministic_turtle(schema_org_graph)
        elapsed = time.time() - start
        triple_count = len(schema_org_graph)
        throughput = triple_count / elapsed if elapsed > 0 else float("inf")

        # Log for benchmark visibility (shows with pytest -v)
        print(f"\n  schema.org: {triple_count} triples in {elapsed:.1f}s "
              f"({throughput:.0f} triples/s)")

        assert elapsed < 60.0, (
            f"Serialization took {elapsed:.1f}s (limit: 60s) for {triple_count} triples"
        )
        assert len(det_ttl) > 1000, "Output suspiciously short"


# ── Kitchen_sink: full pipeline benchmark ──────────────────────────


def _mutate_kitchen_sink(description_suffix: str = "", add_slot: bool = False) -> str:
    """Create a mutated copy of kitchen_sink.yaml **in the same directory** and return its path.

    The copy must live alongside the original so that LinkML relative imports
    (``linkml:types``, ``core``, etc.) resolve correctly.

    Parameters
    ----------
    description_suffix
        Text appended to the first class description found.
    add_slot
        If True, adds a synthetic ``benchmark_notes`` slot to the first class.
    """
    ks_path = Path(KITCHEN_SINK)
    schema = yaml.safe_load(ks_path.read_text())

    if description_suffix or add_slot:
        # Find the first class with a description
        for cls_name, cls_def in schema.get("classes", {}).items():
            if isinstance(cls_def, dict) and cls_def.get("description"):
                if description_suffix:
                    cls_def["description"] += description_suffix
                if add_slot:
                    slots = cls_def.get("slots", [])
                    slots.append("benchmark_notes")
                    cls_def["slots"] = slots
                break

    # Define the synthetic slot if adding one
    if add_slot:
        slots_dict = schema.setdefault("slots", {})
        slots_dict["benchmark_notes"] = {
            "description": "Synthetic benchmark slot for diff quality testing.",
            "range": "string",
        }

    # Write in the same directory so relative imports resolve
    out_path = ks_path.parent / "_benchmark_mutated_kitchen_sink.yaml"
    out_path.write_text(
        yaml.dump(schema, default_flow_style=False, allow_unicode=True),
        encoding="utf-8",
    )
    return str(out_path)


@pytest.mark.parametrize(
    "generator_cls",
    [OwlSchemaGenerator, ShaclGenerator],
    ids=["owl", "shacl"],
)
class TestKitchenSinkDiffQuality:
    """Measure diff quality on the kitchen_sink schema with controlled mutations."""

    def test_mutation_description_change(self, generator_cls):
        """A single description change must produce a small, focused diff.

        Deterministic mode should change only the affected line(s) and their
        immediate context (e.g. SHACL may repeat descriptions in sh:description).
        Non-deterministic mode produces a much larger diff due to blank-node
        and property-ordering instability.
        """
        base = generator_cls(KITCHEN_SINK, deterministic=True).serialize()
        mutated_path = _mutate_kitchen_sink(description_suffix=" (benchmark edit)")
        try:
            mutated = generator_cls(mutated_path, deterministic=True).serialize()
        finally:
            Path(mutated_path).unlink(missing_ok=True)

        det_diff = _diff_line_count(base, mutated)

        # Non-deterministic baseline for comparison
        non_base = generator_cls(KITCHEN_SINK, deterministic=False).serialize()
        non_mutated_path = _mutate_kitchen_sink(description_suffix=" (benchmark edit)")
        try:
            non_mutated = generator_cls(non_mutated_path, deterministic=False).serialize()
        finally:
            Path(non_mutated_path).unlink(missing_ok=True)

        non_diff = _diff_line_count(non_base, non_mutated)

        # The deterministic diff must be small (description + any SHACL mirrors)
        assert det_diff <= 20, (
            f"Deterministic diff too large for a 1-description change: "
            f"{det_diff} lines (expected ≤20)"
        )
        # Signal-to-noise: deterministic must be at least 5× smaller
        if non_diff > 0:
            ratio = non_diff / max(det_diff, 1)
            assert ratio >= 5, (
                f"Insufficient noise reduction: det={det_diff}, non-det={non_diff}, "
                f"ratio={ratio:.1f}× (expected ≥5×)"
            )

        print(f"\n  {generator_cls.__name__} description mutation: "
              f"det={det_diff} lines, non-det={non_diff} lines, "
              f"noise reduction={non_diff / max(det_diff, 1):.0f}×")

    def test_mutation_add_slot(self, generator_cls):
        """Adding a new slot must produce a proportionally small diff.

        A new slot adds ~10-20 triples (label, range, domain, restrictions).
        The diff should be roughly proportional to the new content, not a
        full-file rewrite.
        """
        base = generator_cls(KITCHEN_SINK, deterministic=True).serialize()
        mutated_path = _mutate_kitchen_sink(add_slot=True)
        try:
            mutated = generator_cls(mutated_path, deterministic=True).serialize()
        finally:
            Path(mutated_path).unlink(missing_ok=True)

        det_diff = _diff_line_count(base, mutated)

        # Non-deterministic baseline for comparison
        non_base = generator_cls(KITCHEN_SINK, deterministic=False).serialize()
        non_mutated_path = _mutate_kitchen_sink(add_slot=True)
        try:
            non_mutated = generator_cls(non_mutated_path, deterministic=False).serialize()
        finally:
            Path(non_mutated_path).unlink(missing_ok=True)

        non_diff = _diff_line_count(non_base, non_mutated)

        g_base = Graph()
        g_base.parse(data=base, format="turtle")
        g_mut = Graph()
        g_mut.parse(data=mutated, format="turtle")
        new_triples = len(g_mut) - len(g_base)

        # Diff should be proportional to new triples (allow 5× margin)
        assert det_diff <= max(new_triples * 5, 40), (
            f"Deterministic diff ({det_diff} lines) disproportionate to "
            f"new triples ({new_triples})"
        )
        # Signal-to-noise: deterministic must be at least 5× smaller
        if non_diff > 0:
            ratio = non_diff / max(det_diff, 1)
            assert ratio >= 5, (
                f"Insufficient noise reduction: det={det_diff}, non-det={non_diff}, "
                f"ratio={ratio:.1f}× (expected ≥5×)"
            )

        # NOTE(review): the original ended with a second, stale print that
        # repeated this summary with fewer fields — removed as dead code.
        print(f"\n  {generator_cls.__name__} add-slot mutation: "
              f"det_diff={det_diff} lines, non-det={non_diff} lines, "
              f"new_triples={new_triples}, noise reduction={non_diff / max(det_diff, 1):.0f}×")


@pytest.mark.parametrize(
    "generator_cls",
    [OwlSchemaGenerator, ShaclGenerator],
    ids=["owl", "shacl"],
)
class TestKitchenSinkEquivalence:
    """Verify semantic equivalence between deterministic and non-deterministic modes."""

    def test_triple_count_matches(self, generator_cls):
        """Both modes must produce the same number of triples."""
        det = generator_cls(KITCHEN_SINK, deterministic=True).serialize()
        nondet = generator_cls(KITCHEN_SINK, deterministic=False).serialize()

        g_det = Graph()
        g_det.parse(data=det, format="turtle")
        g_nondet = Graph()
        g_nondet.parse(data=nondet, format="turtle")

        assert len(g_det) == len(g_nondet), (
            f"Triple count mismatch: deterministic={len(g_det)}, "
            f"non-deterministic={len(g_nondet)}"
        )

    def test_byte_stability_across_runs(self, generator_cls):
        """Three deterministic runs must produce identical output."""
        runs = [
            generator_cls(KITCHEN_SINK, deterministic=True).serialize()
            for _ in range(3)
        ]
        hashes = [_sha256(r) for r in runs]
        assert hashes[0] == hashes[1] == hashes[2], (
            f"Deterministic output varies across runs: {hashes}"
        )

    def test_non_deterministic_instability(self, generator_cls):
        """Non-deterministic output should vary across runs (documents the problem).

        This test is advisory — it passes regardless but logs the instability.
        """
        runs = [
            generator_cls(KITCHEN_SINK, deterministic=False).serialize()
            for _ in range(3)
        ]
        hashes = [_sha256(r) for r in runs]
        identical = hashes[0] == hashes[1] == hashes[2]
        print(f"\n  {generator_cls.__name__} non-det stable: {identical} "
              f"(expected: False for Turtle due to bnode/ordering instability)")
# Deterministic Turtle requires pyoxigraph >= 0.4.0 (for Dataset/canonicalize).
# When an older version is present (e.g. pulled in by morph-kgc), skip these tests.
_has_pyoxigraph = False
try:
    import pyoxigraph

    # Dataset only exists from 0.4.0 — presence of the attribute is the version probe.
    _has_pyoxigraph = hasattr(pyoxigraph, "Dataset")
except ImportError:
    pass

pytestmark = pytest.mark.skipif(not _has_pyoxigraph, reason="pyoxigraph >= 0.4.0 required for deterministic tests")

SCHEMA = str(Path(__file__).parent / "input" / "personinfo.yaml")


@pytest.mark.parametrize(
    "generator_cls,kwargs",
    [
        (OwlSchemaGenerator, {}),
        (ShaclGenerator, {}),
        (ContextGenerator, {}),
        (JSONLDGenerator, {}),
    ],
    ids=["owl", "shacl", "context", "jsonld"],
)
def test_deterministic_output_is_identical_across_runs(generator_cls, kwargs):
    """Generate output twice with deterministic=True and verify identity.

    The JSONLDGenerator embeds a ``generation_date`` timestamp that legitimately
    differs between runs, so it is normalized before comparison.
    """
    out1 = generator_cls(SCHEMA, deterministic=True, **kwargs).serialize()
    out2 = generator_cls(SCHEMA, deterministic=True, **kwargs).serialize()
    # JSONLDGenerator embeds a generation_date timestamp — normalize it
    if generator_cls is JSONLDGenerator:
        import re

        # Fix: also consume optional fractional seconds. datetime.isoformat()
        # emits microseconds by default; without "(?:\.\d+)?" the varying
        # ".NNNNNN" tail survived normalization and made this test flaky.
        ts_re = re.compile(r"\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}(?:\.\d+)?")
        out1 = ts_re.sub("TIMESTAMP", out1)
        out2 = ts_re.sub("TIMESTAMP", out2)
    assert out1 == out2, f"{generator_cls.__name__} produced different output across runs"
    assert len(out1) > 100, "Output suspiciously short — generator may have failed silently"
@pytest.mark.parametrize(
    "generator_cls",
    [ContextGenerator, JSONLDGenerator],
    ids=["context", "jsonld"],
)
def test_deterministic_json_has_sorted_keys(generator_cls):
    """When deterministic=True, JSON dict keys should be sorted at all levels.

    For the ContextGenerator, @context keys use grouped ordering (prefixes
    before term entries) — each group is sorted, but not globally.
    """
    parsed = json.loads(generator_cls(SCHEMA, deterministic=True).serialize())
    is_context_gen = generator_cls is ContextGenerator

    def _walk(node, path="root"):
        if isinstance(node, dict):
            keys = list(node.keys())
            if is_context_gen and path == "root.@context":
                # Context generator groups @context keys: @-directives, prefixes, terms
                at_keys = [k for k in keys if k.startswith("@")]
                prefix_keys = [k for k in keys if not k.startswith("@") and isinstance(node[k], str)]
                term_keys = [k for k in keys if not k.startswith("@") and not isinstance(node[k], str)]
                assert at_keys == sorted(at_keys), f"@-keys not sorted: {at_keys}"
                assert prefix_keys == sorted(prefix_keys), f"Prefix keys not sorted: {prefix_keys}"
                assert term_keys == sorted(term_keys), f"Term keys not sorted: {term_keys}"
            else:
                assert keys == sorted(keys), f"Keys not sorted at {path}: {keys}"
            for key, child in node.items():
                _walk(child, f"{path}.{key}")
        elif isinstance(node, list):
            for idx, element in enumerate(node):
                _walk(element, f"{path}[{idx}]")

    _walk(parsed)


@pytest.mark.parametrize(
    "generator_cls",
    [ContextGenerator, JSONLDGenerator],
    ids=["context", "jsonld"],
)
def test_deterministic_json_lists_are_sorted(generator_cls):
    """When deterministic=True, JSON list elements should be sorted."""
    parsed = json.loads(generator_cls(SCHEMA, deterministic=True).serialize())

    def _walk(node, path="root"):
        if isinstance(node, dict):
            for key, child in node.items():
                _walk(child, f"{path}.{key}")
        elif isinstance(node, list):
            # Compare elements by their canonical JSON encoding so dicts sort stably.
            canonical = [json.dumps(element, sort_keys=True, ensure_ascii=False) for element in node]
            assert canonical == sorted(canonical), f"List not sorted at {path}"
            for idx, element in enumerate(node):
                _walk(element, f"{path}[{idx}]")

    _walk(parsed)
@pytest.mark.parametrize(
    "generator_cls",
    [OwlSchemaGenerator, ShaclGenerator],
    ids=["owl", "shacl"],
)
def test_deterministic_turtle_preserves_at_prefix(generator_cls):
    """deterministic_turtle must produce standard @prefix, not SPARQL PREFIX."""
    out = generator_cls(SCHEMA, deterministic=True).serialize()
    # NOTE(review): substring checks could false-positive if "PREFIX " ever
    # appears inside a literal — acceptable for generated schema output.
    assert "@prefix" in out, "Output uses non-standard prefix syntax"
    assert "PREFIX " not in out, "Output uses SPARQL PREFIX instead of Turtle @prefix"


def test_deterministic_turtle_performance():
    """Deterministic OWL generation must complete within 10 seconds for personinfo.

    The Weisfeiler-Lehman approach is O(n log n), so this should easily pass.
    The previous canon=True approach was exponential and failed this test
    for graphs above ~250 triples.
    """
    # Fix: use the monotonic perf_counter instead of time.time(), which can
    # jump under NTP/clock adjustments and skew the elapsed measurement.
    start = time.perf_counter()
    out = OwlSchemaGenerator(SCHEMA, deterministic=True).serialize()
    elapsed = time.perf_counter() - start
    assert elapsed < 10.0, f"Deterministic generation took {elapsed:.1f}s (limit: 10s)"
    assert len(out) > 100, "Output suspiciously short"


def test_shacl_closed_ignored_properties_deterministic():
    """sh:ignoredProperties in closed shapes must be deterministic.

    ``_build_ignored_properties`` collects inherited slots into a set; without
    explicit sorting this produces different ``rdf:first``/``rdf:rest`` chains
    on each run. With ``deterministic=True`` (and sorted Collection inputs)
    the output must be byte-identical.
    """
    runs = [ShaclGenerator(SCHEMA, deterministic=True, closed=True).serialize() for _ in range(3)]
    assert runs[0] == runs[1] == runs[2], "sh:ignoredProperties ordering differs across runs"
    assert "sh:ignoredProperties" in runs[0], "Expected closed shapes with sh:ignoredProperties"
+ """ + runs = [ShaclGenerator(SCHEMA, deterministic=True, closed=True).serialize() for _ in range(3)] + assert runs[0] == runs[1] == runs[2], "sh:ignoredProperties ordering differs across runs" + assert "sh:ignoredProperties" in runs[0], "Expected closed shapes with sh:ignoredProperties" + + +def test_shacl_enum_in_deterministic(): + """sh:in RDF lists for enums must be deterministic. + + ``_build_enum_constraint`` iterates ``enum.permissible_values.items()`` + (dict iteration order) into a ``Collection``. Without sorting, the + ``rdf:first``/``rdf:rest`` chain varies across runs. + """ + runs = [ShaclGenerator(SCHEMA, deterministic=True).serialize() for _ in range(3)] + assert runs[0] == runs[1] == runs[2], "sh:in enum list ordering differs across runs" + assert "sh:in" in runs[0], "Expected sh:in constraints for enums" + + +def test_owl_enum_one_of_deterministic(): + """owl:oneOf RDF lists for enums must be deterministic. + + ``_boolean_expression`` feeds ``pv_uris`` (from ``permissible_values``) + into a ``Collection``. Without sorting, ``owl:oneOf`` list ordering varies. + """ + runs = [OwlSchemaGenerator(SCHEMA, deterministic=True).serialize() for _ in range(3)] + assert runs[0] == runs[1] == runs[2], "owl:oneOf enum list ordering differs across runs" + + +KITCHEN_SINK = str(Path(__file__).parent / "input" / "kitchen_sink.yaml") + + +def test_deterministic_large_schema(): + """End-to-end idempotency on a complex schema (kitchen_sink). + + Exercises many code paths simultaneously: closed shapes, enums, imports, + class hierarchies, and mixed ranges. 
+ """ + owl1 = OwlSchemaGenerator(KITCHEN_SINK, deterministic=True).serialize() + owl2 = OwlSchemaGenerator(KITCHEN_SINK, deterministic=True).serialize() + assert owl1 == owl2, "OWL output differs across runs for kitchen_sink" + assert len(owl1) > 500, "kitchen_sink output suspiciously short" + + shacl1 = ShaclGenerator(KITCHEN_SINK, deterministic=True).serialize() + shacl2 = ShaclGenerator(KITCHEN_SINK, deterministic=True).serialize() + assert shacl1 == shacl2, "SHACL output differs across runs for kitchen_sink" + assert len(shacl1) > 500, "kitchen_sink output suspiciously short" + + +def test_deterministic_context_preserves_jsonld_structure(): + """Deterministic JSON-LD context must preserve conventional structure. + + JSON-LD contexts have a conventional layout: + 1. ``comments`` block first (metadata) + 2. ``@context`` block second, with prefixes grouped before term entries + + ``deterministic_json()`` would scramble this by sorting all keys + uniformly. The context generator must use JSON-LD-aware ordering. 
+ """ + out = ContextGenerator(SCHEMA, deterministic=True, metadata=True).serialize() + parsed = json.loads(out) + + # Top-level key order: "comments" before "@context" + top_keys = list(parsed.keys()) + assert "comments" in top_keys, "Expected 'comments' block with metadata=True" + assert top_keys.index("comments") < top_keys.index("@context"), ( + f"'comments' should precede '@context', got: {top_keys}" + ) + + # Inside @context: @-directives, then prefixes (str values), then terms (dict values) + ctx = parsed["@context"] + ctx_keys = list(ctx.keys()) + + at_keys = [k for k in ctx_keys if k.startswith("@")] + prefix_keys = [k for k in ctx_keys if not k.startswith("@") and isinstance(ctx[k], str)] + term_keys = [k for k in ctx_keys if not k.startswith("@") and not isinstance(ctx[k], str)] + + # Verify grouping: all @-keys before all prefix keys before all term keys + last_at = max(ctx_keys.index(k) for k in at_keys) if at_keys else -1 + first_prefix = min(ctx_keys.index(k) for k in prefix_keys) if prefix_keys else len(ctx_keys) + last_prefix = max(ctx_keys.index(k) for k in prefix_keys) if prefix_keys else -1 + first_term = min(ctx_keys.index(k) for k in term_keys) if term_keys else len(ctx_keys) + + assert last_at < first_prefix, "@-directives must come before prefixes" + assert last_prefix < first_term, "Prefixes must come before term entries" + + # Verify each group is sorted internally + assert at_keys == sorted(at_keys), f"@-directives not sorted: {at_keys}" + assert prefix_keys == sorted(prefix_keys), f"Prefixes not sorted: {prefix_keys}" + assert term_keys == sorted(term_keys), f"Term entries not sorted: {term_keys}" + + +def test_non_deterministic_is_default(): + """Verify that ``deterministic`` defaults to False.""" + gen = OwlSchemaGenerator(SCHEMA) + assert gen.deterministic is False + + +@pytest.mark.xfail( + reason=( + "Collection sorting (owl:oneOf, sh:in) in deterministic mode intentionally " + "reorders RDF list triples for canonical output. 
@pytest.mark.xfail(
    reason=(
        "Collection sorting (owl:oneOf, sh:in) in deterministic mode intentionally "
        "reorders RDF list triples for canonical output. The resulting graph is "
        "semantically equivalent (OWL/SHACL interpret these as unordered sets) but "
        "not RDF-isomorphic because rdf:first/rdf:rest chains encode ordering."
    ),
    strict=True,
)
@pytest.mark.parametrize(
    "generator_cls",
    [OwlSchemaGenerator, ShaclGenerator],
    ids=["owl", "shacl"],
)
def test_deterministic_turtle_is_isomorphic(generator_cls):
    """Deterministic output is NOT RDF-isomorphic to non-deterministic output.

    This documents the trade-off identified in linkml/linkml#3295 review:
    deterministic mode sorts Collection inputs (owl:oneOf, sh:in,
    sh:ignoredProperties) to produce canonical RDF list ordering. Since RDF
    Collections encode order via rdf:first/rdf:rest triples, the sorted graph
    is structurally different from the insertion-order graph — even though the
    OWL/SHACL semantics are identical (these Collections represent sets).

    The test is marked xfail(strict=True) so that it:
    - Documents the known, intentional non-isomorphism
    - Alerts maintainers if the behaviour changes (strict xfail fails on pass)
    """
    parsed = {}
    for mode in (True, False):
        ttl = generator_cls(SCHEMA, deterministic=mode).serialize()
        graph = Graph()
        graph.parse(data=ttl, format="turtle")
        parsed[mode] = graph
    g_det, g_nondet = parsed[True], parsed[False]

    # NOTE(review): inside a strict xfail, a failure of this count check is
    # also absorbed as the expected failure — a count regression would be
    # hidden here (it is covered separately by non-xfail tests).
    assert len(g_det) == len(g_nondet), (
        f"Triple count mismatch: deterministic={len(g_det)}, non-deterministic={len(g_nondet)}"
    )
    assert isomorphic(g_det, g_nondet), (
        f"{generator_cls.__name__}: deterministic output is NOT isomorphic "
        "to non-deterministic output — the serialization changed the graph"
    )


@pytest.mark.parametrize(
    "generator_cls",
    [OwlSchemaGenerator, ShaclGenerator],
    ids=["owl", "shacl"],
)
def test_non_deterministic_output_unchanged(generator_cls):
    """Non-deterministic output must still produce valid RDF.

    Ensures that changes for deterministic mode don't break default behavior.
    """
    out = generator_cls(SCHEMA, deterministic=False).serialize()
    assert len(out) > 100, "Output suspiciously short"
    graph = Graph()
    graph.parse(data=out, format="turtle")
    assert len(graph) > 50, f"Graph has too few triples ({len(graph)})"
+ """ + out = generator_cls(SCHEMA, deterministic=False).serialize() + assert len(out) > 100, "Output suspiciously short" + g = Graph() + g.parse(data=out, format="turtle") + assert len(g) > 50, f"Graph has too few triples ({len(g)})" + + +@pytest.mark.parametrize( + "generator_cls,kwargs", + [ + (OwlSchemaGenerator, {}), + (ShaclGenerator, {}), + (ContextGenerator, {}), + (JSONLDGenerator, {}), + ], + ids=["owl", "shacl", "context", "jsonld"], +) +def test_non_deterministic_produces_valid_output(generator_cls, kwargs): + """All generators must produce valid output in non-deterministic mode.""" + out = generator_cls(SCHEMA, deterministic=False, **kwargs).serialize() + assert len(out) > 100, f"{generator_cls.__name__} output suspiciously short" + + +@pytest.mark.xfail( + reason=( + "Collection sorting in deterministic mode produces non-isomorphic RDF " + "(different rdf:first/rdf:rest triples). See test_deterministic_turtle_is_isomorphic." + ), + strict=True, +) +@pytest.mark.parametrize( + "generator_cls", + [OwlSchemaGenerator, ShaclGenerator], + ids=["owl", "shacl"], +) +def test_deterministic_kitchen_sink_isomorphic(generator_cls): + """Isomorphism check on the complex kitchen_sink schema. + + Expected to fail for the same reason as test_deterministic_turtle_is_isomorphic: + Collection sorting changes the RDF structure while preserving OWL/SHACL semantics. + """ + out_det = generator_cls(KITCHEN_SINK, deterministic=True).serialize() + out_nondet = generator_cls(KITCHEN_SINK, deterministic=False).serialize() + + g_det = Graph() + g_det.parse(data=out_det, format="turtle") + + g_nondet = Graph() + g_nondet.parse(data=out_nondet, format="turtle") + + assert isomorphic(g_det, g_nondet), ( + f"{generator_cls.__name__}: kitchen_sink deterministic output is NOT isomorphic to non-deterministic output" + )