From ec1527e37d53fbd7951509fca9bf4cfaa4814be9 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Mon, 23 Feb 2026 08:41:53 +0000
Subject: [PATCH 1/4] Initial plan


From b918b3651690e20630256f469c07e81ecdb6ae5f Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Mon, 23 Feb 2026 08:56:56 +0000
Subject: [PATCH 2/4] =?UTF-8?q?feat(knowledge=5Fgraphs):=20session=2082=20?=
 =?UTF-8?q?=E2=80=94=20KGAtomEncoder=20+=20KGWitnessBuilder=20(v3.22.36)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Co-authored-by: endomorphosis <3405202+endomorphosis@users.noreply.github.com>
---
 .../CHANGELOG_KNOWLEDGE_GRAPHS.md             |  34 +
 .../knowledge_graphs/DEFERRED_FEATURES.md     |  85 +++
 .../knowledge_graphs/IMPROVEMENT_TODO.md      |   1 +
 .../knowledge_graphs/MASTER_STATUS.md         |   8 +-
 ipfs_datasets_py/knowledge_graphs/ROADMAP.md  |   3 +-
 .../knowledge_graphs/query/__init__.py        |   7 +
 .../knowledge_graphs/query/groth16_bridge.py  |  82 +++
 .../query/groth16_kg_witness.py               | 664 ++++++++++++++++++
 .../test_master_status_session80.py           |  10 +-
 .../test_master_status_session81.py           |  21 +-
 .../test_master_status_session82.py           | 604 ++++++++++++++++
 11 files changed, 1509 insertions(+), 10 deletions(-)
 create mode 100644 ipfs_datasets_py/knowledge_graphs/query/groth16_kg_witness.py
 create mode 100644 tests/unit/knowledge_graphs/test_master_status_session82.py

diff --git a/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md b/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md
index 3276d81e4..a6fdac944 100644
--- a/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md
+++ b/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md
@@ -5,6 +5,40 @@ All notable changes to the knowledge_graphs module will be documented in this fi
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 
+## [3.22.36] - 2026-02-23
+
+### Added — TDFOL_v1 Witness Builder for Groth16 backend (Session 82) — 50 tests
+
+**`query/groth16_kg_witness.py`** (new module):
+- `KGAtomEncoder(max_length=64)` — normalize arbitrary KG strings to valid
+  single-word TDFOL_v1 atoms required by the Groth16 Rust backend
+  (`processors/groth16_backend`). Core `normalize(s)` + domain-specific encoders:
+  `encode_entity_type`, `encode_name`, `encode_relationship_type`,
+  `encode_entity_id`, `encode_property_key`. Compound atoms:
+  `atom_for_entity`, `atom_for_entity_exists`, `atom_for_path_exists`,
+  `atom_for_entity_property`.
+- `KGWitnessBuilder(circuit_version=1, ruleset_id="TDFOL_v1")` — build complete
+  TDFOL_v1 witness input dicts compatible with `WitnessInput` struct:
+  - `entity_exists(entity_type, name, entity_id, confidence)` → witness proving a
+    named entity exists without revealing its ID
+  - `path_exists(path_ids, rel_types, start_type, end_type)` → witness proving a
+    path exists without revealing node IDs
+  - `entity_property(entity_id, property_key, value_hash)` → witness proving an
+    entity has a property (value hidden behind SHA-256 hash)
+  - `query_answer_count(min_count, actual_count, query_type)` → witness proving
+    result count ≥ threshold
+  - All builders auto-compute `theorem_hash_hex` and `axioms_commitment_hex`
+  - Circuit v2: auto-generates `intermediate_steps` when not provided
+
+**`query/groth16_bridge.py`** (updated):
+- `KGEntityFormula.to_tdfol_atoms(proof_type, entity_type, name_or_end_type,
+  entity_id, confidence) -> dict` (new classmethod) — returns valid TDFOL_v1
+  single-word atoms for `entity_exists` / `path_exists` / `entity_property`
+  proof types using `KGAtomEncoder` internally.
+
+**`query/__init__.py`** (updated):
+- `KGAtomEncoder` and `KGWitnessBuilder` exported + added to `__all__`.
+
 ## [3.22.35] - 2026-02-23
 
 ### Added — 5 new MCP server tools for query/extraction features (Session 81) — 42 tests
diff --git a/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md b/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md
index 2ca47e7f8..cc1890c22 100644
--- a/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md
+++ b/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md
@@ -688,6 +688,91 @@ assert kg.list_snapshots() == ["before_merge"]
 
 ---
 
+## P13: Delivered in v3.22.36 (TDFOL_v1 Witness Builder for Groth16 backend)
+
+### 27. TDFOL_v1 Atom Encoder
+
+**Status:** ✅ Implemented (v3.22.36 — 2026-02-23)
+**Location:** `query/groth16_kg_witness.py` — `KGAtomEncoder`
+**Implementation:**
+- `KGAtomEncoder(max_length=64)` — normalizes arbitrary Knowledge Graph strings
+  (entity types, names, relationship types, entity IDs, property keys) to valid
+  single-word TDFOL_v1 atoms accepted by the Groth16 Rust backend in
+  `processors/groth16_backend`.
+- `normalize(s) -> str` — core normalizer: lower-case, replace invalid chars with
+  `_`, strip leading non-letters, truncate, fallback to `"entity"` for empty input.
+- Domain-specific encoders: `encode_entity_type`, `encode_name`,
+  `encode_relationship_type`, `encode_entity_id`, `encode_property_key`.
+- Compound atoms: `atom_for_entity(type, name)` → `"type_name"`;
+  `atom_for_entity_exists(type, name)` → `"type_name_exists"`;
+  `atom_for_path_exists(start, end)` → `"path_start_to_end_exists"`;
+  `atom_for_entity_property(id, key)` → `"id_has_key"`.
+
+**Example (now works):**
+```python
+from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import KGAtomEncoder
+
+enc = KGAtomEncoder()
+enc.encode_entity_type("Person")          # "person"
+enc.encode_name("Acme Corp")              # "acme_corp"
+enc.encode_name("Alice-Jane O'Brien")     # "alice_jane_o_brien"
+enc.atom_for_entity_exists("Person", "Alice")   # "person_alice_exists"
+enc.atom_for_path_exists("Person", "Org")       # "path_person_to_org_exists"
+```
+
+**Tests:** `tests/unit/knowledge_graphs/test_master_status_session82.py`
+
+---
+
+### 28. TDFOL_v1 Witness Builder
+
+**Status:** ✅ Implemented (v3.22.36 — 2026-02-23)
+**Location:** `query/groth16_kg_witness.py` — `KGWitnessBuilder`
+**Implementation:**
+- `KGWitnessBuilder(circuit_version=1, ruleset_id="TDFOL_v1", encoder=None)` —
+  builds complete TDFOL_v1 witness input dicts compatible with the `WitnessInput`
+  struct in the Groth16 Rust backend (`processors/groth16_backend`).
+- `entity_exists(entity_type, name, entity_id, confidence) -> dict` — proves
+  existence of a named entity without revealing its ID.
+- `path_exists(path_ids, rel_types, start_type, end_type) -> dict` — proves a
+  graph path exists without revealing node IDs.
+- `entity_property(entity_id, property_key, value_hash) -> dict` — proves an
+  entity has a specific property value (via SHA-256 hash).
+- `query_answer_count(min_count, actual_count, query_type) -> dict` — proves the
+  result count meets a threshold.
+- All builders auto-compute `theorem_hash_hex` and `axioms_commitment_hex`.
+- Circuit v2 support: auto-generates `intermediate_steps` when not provided.
+
+**Example (now works):**
+```python
+from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import KGWitnessBuilder
+import json
+
+builder = KGWitnessBuilder()
+witness = builder.entity_exists("Person", "Alice", "eid_001", confidence=0.95)
+# witness["theorem"]        → "person_alice_exists"
+# witness["private_axioms"] → ["eid_001_is_person", "eid_001_has_name_alice", ...]
+# witness["theorem_hash_hex"] → 64-char hex SHA-256
+# witness is JSON-serializable and ready for the Groth16 binary
+
+# For the real Groth16 backend (when binary is compiled):
+# import os; os.environ["IPFS_DATASETS_ENABLE_GROTH16"] = "1"
+# from ipfs_datasets_py.logic.zkp.backends.groth16_ffi import Groth16Backend
+# backend = Groth16Backend()
+# proof_json = backend.prove(json.dumps(witness))
+```
+
+**Also added:** `KGEntityFormula.to_tdfol_atoms(proof_type, entity_type,
+name_or_end_type, entity_id, confidence) -> dict` — returns valid TDFOL_v1
+atoms for entity_exists / path_exists / entity_property proof types, bridging
+the human-readable formula strings with the single-word atom requirement.
+
+**Tests:** `tests/unit/knowledge_graphs/test_master_status_session82.py`
+
+---
+
+---
+
 ## P7: Delivered in v3.22.26 (formerly v4.0+ "GraphQL API support")
 
 ### 19. GraphQL API Support
diff --git a/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md b/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md
index ebcc4b8a0..ff3add900 100644
--- a/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md
+++ b/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md
@@ -30,6 +30,7 @@
 
 ## Session log (most recent first)
 
+- **Session 82 (2026-02-23):** TDFOL_v1 witness builder — `query/groth16_kg_witness.py` (`KGAtomEncoder`: normalize KG strings to valid single-word TDFOL_v1 atoms via `normalize()`/`encode_entity_type()`/`encode_name()`/`encode_relationship_type()`/`encode_entity_id()`/`encode_property_key()`/`atom_for_entity()`/`atom_for_entity_exists()`/`atom_for_path_exists()`/`atom_for_entity_property()`; `KGWitnessBuilder`: build complete TDFOL_v1 witness input dicts for `entity_exists`/`path_exists`/`entity_property`/`query_answer_count` proofs; auto-computes `theorem_hash_hex`+`axioms_commitment_hex`; circuit v2 support); `KGEntityFormula.to_tdfol_atoms()` classmethod added to `groth16_bridge.py`; `query/__init__.py` + `__all__` updated; DEFERRED_FEATURES P13 §27+§28; 80 tests. v3.22.35→v3.22.36.
 - **Session 81 (2026-02-23):** 5 new MCP server tools exposing query/extraction features — `graph_graphql_query.py` (execute GraphQL query via `KnowledgeGraphQLExecutor`) + `graph_visualize.py` (DOT/Mermaid/D3 JSON/ASCII via `KnowledgeGraphVisualizer`) + `graph_complete_suggestions.py` (missing-relationship suggestions via `KnowledgeGraphCompleter`) + `graph_explain.py` (explainable-AI entity/relationship/path/why_connected via `QueryExplainer`) + `graph_provenance_verify.py` (tamper-detection via `ProvenanceChain.verify_chain()`); 5 new `KnowledgeGraphManager` async methods; `graph_tools/__init__.py` + `README.md` updated (11→19 tools); 42 tests. v3.22.34→v3.22.35.
 - **Session 80 (2026-02-23):** ROADMAP Research Areas delivered — `query/completion.py` (`KnowledgeGraphCompleter`; 6 structural completion patterns: triadic closure, common neighbour, symmetric relation, transitive relation, inverse relation, type compatibility; `CompletionSuggestion` + `CompletionReason`; `find_missing_relationships`/`find_isolated_entities`/`compute_completion_score`/`explain_suggestion`) + `query/explanation.py` (`QueryExplainer`; `explain_entity`/`explain_relationship`/`explain_path`/`explain_query_result`/`why_connected`/`entity_importance_score`; `EntityExplanation`/`RelationshipExplanation`/`PathExplanation`/`ExplanationDepth` dataclasses); 8 new symbols in `query/__init__.py`; DEFERRED_FEATURES P12 §25+§26; 52 tests. v3.22.33→v3.22.34.
 - **Session 79 (2026-02-23):** Comprehensive documentation update — `query/README.md` v2.1.0→v3.22.33: added 5 new module rows (graphql.py/federation.py/gnn.py/zkp.py/groth16_bridge.py) + "Advanced Query Features" code examples for each + "Recent Additions" table; stale "Future Enhancements" (listing GraphQL as future) removed. `docs/knowledge_graphs/API_REFERENCE.md` v3.22.22→v3.22.33: new "Advanced Extraction APIs" section (KGDiff/GraphEvents/Snapshots/ProvenanceChain/Visualizer) + new "Advanced Query APIs" section (GraphQL/FederatedKG/GNN/ZKP/Groth16) with full examples; ToC updated. `docs/knowledge_graphs/USER_GUIDE.md` v2.0.0→v3.22.33: §11 "Future Roadmap" (features listed as planned for Q2-Q1 2027) → "Delivered Features (v3.22.x)" (15-row delivery table all ✅ + usage examples; stale Experimental Features block removed). 46 doc integrity tests. v3.22.32→v3.22.33.
diff --git a/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md b/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md
index 7f3dd9f1c..ad7cb21b7 100644
--- a/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md
+++ b/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md
@@ -1,9 +1,9 @@
 # Knowledge Graphs Module - Master Status Document
 
-**Version:** 3.22.35  
+**Version:** 3.22.36  
 **Status:** ✅ Production Ready  
-**Last Updated:** 2026-02-23 (session 81)  
-**Last Major Release:** v3.22.35 (session 81: 5 new MCP server tools for query/extraction features — `graph_graphql_query` / `graph_visualize` / `graph_complete_suggestions` / `graph_explain` / `graph_provenance_verify`; 5 new `KnowledgeGraphManager` methods; `graph_tools/__init__.py` + `README.md` updated; 42 tests)
+**Last Updated:** 2026-02-23 (session 82)  
+**Last Major Release:** v3.22.36 (session 82: `KGAtomEncoder` + `KGWitnessBuilder` in `query/groth16_kg_witness.py` — TDFOL_v1 atom normalization and witness input construction for the Groth16 Rust backend; `KGEntityFormula.to_tdfol_atoms()` added to `groth16_bridge.py`; `query/__init__.py` exports updated; 50 tests)
 
 ---
 
@@ -19,7 +19,7 @@
 | **Folder Refactoring** | ✅ Complete | All root-level modules moved to subpackages (2026-02-20) |
 | **New MCP Tools** | ✅ Complete | graph_srl_extract, graph_ontology_materialize, graph_distributed_execute, graph_graphql_query, graph_visualize, graph_complete_suggestions, graph_explain, graph_provenance_verify |
 | **Test Coverage** | **99.99% (1 missed line)** | Session 58: 3,759 pass, 2 skip, **0 fail** (full dep env); 1 missed line |
-| **Documentation** | ✅ Up to Date | Reflects v3.22.35 structure |
+| **Documentation** | ✅ Up to Date | Reflects v3.22.36 structure |
 | **Known Issues** | None | 0 failures; all skips intentional (libipld/spaCy absent when not installed) |
 | **Next Milestone** | v4.0 (2027+) | 1 missed line: `_entity_helpers.py:117` (intentional defensive guard) — 99.99% coverage |
 
diff --git a/ipfs_datasets_py/knowledge_graphs/ROADMAP.md b/ipfs_datasets_py/knowledge_graphs/ROADMAP.md
index 57d97b2b6..db2bddc88 100644
--- a/ipfs_datasets_py/knowledge_graphs/ROADMAP.md
+++ b/ipfs_datasets_py/knowledge_graphs/ROADMAP.md
@@ -1,7 +1,7 @@
 # Knowledge Graphs - Development Roadmap
 
 **Last Updated:** 2026-02-23  
-**Current Version:** 3.22.35  
+**Current Version:** 3.22.36  
 **Status:** Production Ready (99.99% test coverage)
 
 ---
@@ -438,6 +438,7 @@ We follow [Semantic Versioning](https://semver.org/):
 | 3.22.29 | 2026-02-23 | ✅ Released | Deferred v4.0+ blockchain-style provenance chain: extraction/provenance.py (ProvenanceChain; ProvenanceEvent with SHA-256 CID; ProvenanceEventType 7 types; verify_chain() tamper detection; to_jsonl/from_jsonl); KnowledgeGraph.enable_provenance/disable_provenance/.provenance; auto-recording in add_entity/add_relationship; DEFERRED_FEATURES P10 §22; 45 tests (session75) |
 | 3.22.30 | 2026-02-23 | ✅ Released | Deferred v4.0+ GNN integration (query/gnn.py: GraphNeuralNetworkAdapter with GRAPH_CONV/SAGE/ATTENTION; node embeddings, link prediction, similar-entity search, numpy/PyTorch export) + ZKP support (query/zkp.py: KGZKProver/KGZKVerifier; 4 proof types; SHA-256 commitments; nullifier replay protection); DEFERRED_FEATURES P11 §23+§24; 55 tests (session76) |
 | 3.22.35 | 2026-02-23 | ✅ Released | 5 new MCP tools for query/extraction features (graph_graphql_query, graph_visualize, graph_complete_suggestions, graph_explain, graph_provenance_verify); 5 new KnowledgeGraphManager methods; graph_tools/__init__.py+README.md updated; 42 tests (session81) |
+| 3.22.36 | 2026-02-23 | ✅ Released | TDFOL_v1 witness builder: `query/groth16_kg_witness.py` (`KGAtomEncoder` normalizes KG strings to valid single-word TDFOL_v1 atoms; `KGWitnessBuilder` builds complete witness input dicts for entity_exists/path_exists/entity_property/query_answer_count proofs compatible with Groth16 Rust backend); `KGEntityFormula.to_tdfol_atoms()` classmethod added; `query/__init__.py` exports updated; 50 tests (session82) |
 | 3.22.34 | 2026-02-23 | ✅ Released | ROADMAP Research Areas: Knowledge Graph Completion (query/completion.py: KnowledgeGraphCompleter; 6 structural patterns: triadic closure/common neighbour/symmetric/transitive/inverse/type-compat; CompletionSuggestion+CompletionReason) + Explainable AI (query/explanation.py: QueryExplainer; explain_entity/relationship/path/why_connected/entity_importance_score; SURFACE/STANDARD/DEEP depth; EntityExplanation/RelationshipExplanation/PathExplanation); DEFERRED_FEATURES P12 §25+§26; 52 tests (session80) |
 | 3.22.33 | 2026-02-23 | ✅ Released | Comprehensive documentation update: query/README.md v2.1.0→v3.22.33 (5 new module sections + Advanced Query Features + Recent Additions table); docs/knowledge_graphs/API_REFERENCE.md v3.22.22→v3.22.33 (Advanced Extraction APIs + Advanced Query APIs sections with examples); docs/knowledge_graphs/USER_GUIDE.md v2.0.0→v3.22.33 (§11 Future Roadmap→Delivered Features table with 15 items all ✅); 46 doc tests (session79) |
 | 3.22.32 | 2026-02-23 | ✅ Released | Groth16 Bridge: query/groth16_bridge.py (groth16_binary_available+groth16_enabled+Groth16KGConfig+KGEntityFormula+create_groth16_kg_prover+create_groth16_kg_verifier+describe_groth16_status); direct KG↔TDFOL_v1 theorem/axiom mapping; binary availability probe; 7 query/__init__.py exports; DEFERRED_FEATURES §24 Direct Groth16 Bridge subsection; 50 tests (session78) |
diff --git a/ipfs_datasets_py/knowledge_graphs/query/__init__.py b/ipfs_datasets_py/knowledge_graphs/query/__init__.py
index a5460d883..480ab9cb6 100644
--- a/ipfs_datasets_py/knowledge_graphs/query/__init__.py
+++ b/ipfs_datasets_py/knowledge_graphs/query/__init__.py
@@ -131,6 +131,10 @@
     create_groth16_kg_verifier,
     describe_groth16_status,
 )
+from .groth16_kg_witness import (
+    KGAtomEncoder,
+    KGWitnessBuilder,
+)
 from .completion import (
     KnowledgeGraphCompleter,
     CompletionSuggestion,
@@ -200,6 +204,9 @@
     'create_groth16_kg_prover',
     'create_groth16_kg_verifier',
     'describe_groth16_status',
+    # Groth16 KG Witness Builder (v3.22.36 — TDFOL_v1 witness construction)
+    'KGAtomEncoder',
+    'KGWitnessBuilder',
     # Knowledge Graph Completion (v3.22.34 — Research Area)
     'KnowledgeGraphCompleter',
     'CompletionSuggestion',
diff --git a/ipfs_datasets_py/knowledge_graphs/query/groth16_bridge.py b/ipfs_datasets_py/knowledge_graphs/query/groth16_bridge.py
index 5fb94fb6b..82e3545d2 100644
--- a/ipfs_datasets_py/knowledge_graphs/query/groth16_bridge.py
+++ b/ipfs_datasets_py/knowledge_graphs/query/groth16_bridge.py
@@ -175,6 +175,13 @@ class KGEntityFormula:
     be valid Prolog or any specific formal language — the TDFOL_v1 circuit
     hashes the strings to derive commitments.
 
+    .. note::
+
+        The ``to_tdfol_atoms()`` class method (added in v3.22.36) returns
+        *valid single-word TDFOL_v1 atoms* from the same concept mappings, for
+        use with the Rust Groth16 binary.  For full witness construction use
+        :class:`~ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness.KGWitnessBuilder`.
+
     Example::
 
         theorem = KGEntityFormula.entity_exists_theorem("Person", "Alice")
@@ -182,6 +189,11 @@ class KGEntityFormula:
 
         axioms = KGEntityFormula.entity_exists_axioms("e-001", "Person", "Alice", 0.95)
         # ["e-001 is person", "e-001 has name alice", "e-001 confidence 0.95"]
+
+        # Single-word atom versions (v3.22.36):
+        atoms = KGEntityFormula.to_tdfol_atoms("entity_exists", "Person", "Alice", "e-001")
+        # atoms["theorem"] == "person_alice_exists"
+        # atoms["axioms"][0] == "e_001_is_person"
     """
 
     @staticmethod
@@ -259,6 +271,76 @@ def property_axioms(
             f"property {pk} committed {value_hash[:16]}",
         ]
 
+    @classmethod
+    def to_tdfol_atoms(
+        cls,
+        proof_type: str,
+        entity_type: str,
+        name_or_end_type: str,
+        entity_id: str = "",
+        confidence: float = 1.0,
+    ) -> Dict[str, Any]:
+        """Return TDFOL_v1 *single-word* atoms for a KG proof concept.
+
+        Unlike the other methods which return human-readable strings, this
+        method uses :class:`~ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness.KGAtomEncoder`
+        to produce valid TDFOL_v1 atoms suitable for direct submission to the
+        Groth16 Rust binary.
+
+        Args:
+            proof_type: One of ``"entity_exists"``, ``"path_exists"``,
+                ``"entity_property"``.
+            entity_type: Entity type (or path start-type for path proofs).
+            name_or_end_type: Entity name, or path end-type for path proofs.
+            entity_id: Private entity ID (encoded as axiom); optional for
+                path proofs.
+            confidence: Confidence score [0, 1].
+
+        Returns:
+            Dict with keys ``"proof_type"``, ``"theorem"`` (atom), and
+            ``"axioms"`` (list of atoms / implications).
+
+        Added in v3.22.36.
+        """
+        from .groth16_kg_witness import KGAtomEncoder
+        enc = KGAtomEncoder()
+
+        if proof_type == "entity_exists":
+            theorem = enc.atom_for_entity_exists(entity_type, name_or_end_type)
+            type_atom = enc.encode_entity_type(entity_type)
+            name_atom = enc.encode_name(name_or_end_type)
+            eid_atom = enc.encode_entity_id(entity_id) if entity_id else "unknown_entity"
+            conf_int = max(0, min(9999, int(round(confidence * 1000))))
+            axioms = [
+                f"{eid_atom}_is_{type_atom}",
+                f"{eid_atom}_has_name_{name_atom}",
+                f"conf_{conf_int:04d}",
+                f"{type_atom}_{name_atom}_exists",
+            ]
+        elif proof_type == "path_exists":
+            theorem = enc.atom_for_path_exists(entity_type, name_or_end_type)
+            axioms = [
+                f"path_from_{enc.encode_entity_type(entity_type)}",
+                f"path_to_{enc.encode_entity_type(name_or_end_type)}",
+            ]
+        elif proof_type == "entity_property":
+            theorem = enc.atom_for_entity_property(entity_id or entity_type, name_or_end_type)
+            eid_atom = enc.encode_entity_id(entity_id or entity_type)
+            pk_atom = enc.encode_property_key(name_or_end_type)
+            axioms = [
+                f"{eid_atom}_property_{pk_atom}",
+                f"{eid_atom}_has_{pk_atom}",
+            ]
+        else:
+            theorem = enc.normalize(proof_type) or "unknown_proof"
+            axioms = []
+
+        return {
+            "proof_type": proof_type,
+            "theorem": theorem,
+            "axioms": axioms,
+        }
+
 
 # ---------------------------------------------------------------------------
 # Prover / verifier factories
diff --git a/ipfs_datasets_py/knowledge_graphs/query/groth16_kg_witness.py b/ipfs_datasets_py/knowledge_graphs/query/groth16_kg_witness.py
new file mode 100644
index 000000000..a7e346db0
--- /dev/null
+++ b/ipfs_datasets_py/knowledge_graphs/query/groth16_kg_witness.py
@@ -0,0 +1,664 @@
+"""
+TDFOL_v1 Witness Builder for Knowledge Graph Zero-Knowledge Proofs.
+
+Bridges the KG domain (entity types, names, IDs, relationships) to the
+TDFOL_v1 circuit expected by the Groth16 Rust backend in
+``processors/groth16_backend``.
+
+The Rust backend requires:
+- **theorem**: a single TDFOL_v1 atom (ASCII-letter start, alphanumeric + ``_``).
+- **private_axioms**: list of atoms or implications ``"atom -> atom"``.
+- **intermediate_steps** (circuit v2 only): non-empty list of atoms forming a
+  derivation trace.
+- **axioms_commitment_hex**: 64-hex-char SHA-256 commitment over axioms.
+- **theorem_hash_hex**: 64-hex-char SHA-256 hash of the theorem atom.
+
+This module provides:
+
+- :class:`KGAtomEncoder` — normalize arbitrary KG strings (entity types, names,
+  relationship types, entity IDs) into valid single-word TDFOL_v1 atoms.
+- :class:`KGWitnessBuilder` — build complete TDFOL_v1 witness input dicts ready
+  for submission to the Groth16 binary.
+
+Quick start
+-----------
+
+.. code-block:: python
+
+    from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+        KGAtomEncoder,
+        KGWitnessBuilder,
+    )
+
+    enc = KGAtomEncoder()
+
+    # Encode KG concepts to valid TDFOL_v1 atoms
+    print(enc.encode_entity_type("Person"))         # "person"
+    print(enc.encode_name("Acme Corp"))             # "acme_corp"
+    print(enc.encode_name("Alice-Jane O'Brien"))    # "alice_jane_o_brien"
+
+    # Build a witness for entity_exists proof
+    builder = KGWitnessBuilder()
+    witness = builder.entity_exists(
+        entity_type="Person",
+        name="Alice",
+        entity_id="eid_001",
+        confidence=0.95,
+    )
+    # witness["theorem"]        → "person_alice_exists"
+    # witness["private_axioms"] → ["eid_001_is_person", "eid_001_has_name_alice", ...]
+
+    # Build a witness for path_exists proof
+    witness = builder.path_exists(
+        path_ids=["eid_001", "eid_002", "eid_003"],
+        rel_types=["knows", "works_at"],
+        start_type="Person",
+        end_type="Organization",
+    )
+
+    # Build a witness for entity_property proof
+    import hashlib
+    value_hash = hashlib.sha256(b"30").hexdigest()
+    witness = builder.entity_property(
+        entity_id="eid_001",
+        property_key="age",
+        value_hash=value_hash,
+    )
+
+Integration with the Groth16 backend
+-------------------------------------
+
+.. code-block:: python
+
+    import os, json
+    os.environ["IPFS_DATASETS_ENABLE_GROTH16"] = "1"
+
+    from ipfs_datasets_py.logic.zkp.backends.groth16_ffi import Groth16Backend
+    from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import KGWitnessBuilder
+
+    backend = Groth16Backend()
+    builder = KGWitnessBuilder(circuit_version=1)
+    witness = builder.entity_exists("Person", "Alice", "eid_001", 0.95)
+    proof_json = backend.prove(json.dumps(witness))
+"""
+
+from __future__ import annotations
+
+import hashlib
+import json
+import re
+from typing import Any, Dict, List, Optional
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+
+def _sha256_hex(data: str) -> str:
+    """Return 64-char hex SHA-256 of *data*."""
+    return hashlib.sha256(data.encode("utf-8")).hexdigest()
+
+
+def _is_tdfol_atom(s: str) -> bool:
+    """Return *True* if *s* is a valid TDFOL_v1 atom.
+
+    A TDFOL_v1 atom starts with an ASCII letter and contains only
+    alphanumeric characters or underscores (no spaces, hyphens, dots, …).
+    """
+    if not s:
+        return False
+    if not s[0].isascii() or not s[0].isalpha():
+        return False
+    return all(c.isascii() and (c.isalnum() or c == "_") for c in s)
+
+
+# ---------------------------------------------------------------------------
+# KGAtomEncoder
+# ---------------------------------------------------------------------------
+
+class KGAtomEncoder:
+    """Normalize Knowledge Graph strings to valid TDFOL_v1 atoms.
+
+    TDFOL_v1 atoms must:
+    - Start with an ASCII letter.
+    - Contain only ASCII alphanumeric characters or underscores.
+    - Be non-empty.
+
+    This encoder handles entity types, entity names, relationship types,
+    entity IDs, and property keys — converting any input string into a
+    compliant atom.
+
+    Args:
+        max_length: Maximum atom length (default 64).  Atoms are truncated
+            (never left-padded) when they exceed this limit.
+
+    Example::
+
+        enc = KGAtomEncoder()
+
+        enc.encode_entity_type("Person")          # "person"
+        enc.encode_entity_type("AIModel")         # "aimodel"
+        enc.encode_name("Alice-Jane O'Brien")     # "alice_jane_o_brien"
+        enc.encode_name("Acme Corp (Ltd)")        # "acme_corp__ltd_"
+        enc.encode_relationship_type("works_at")  # "works_at"
+        enc.encode_entity_id("eid-abc/123")       # "eid_abc_123"
+        enc.atom_for_entity("Person", "Alice")    # "person_alice"
+    """
+
+    def __init__(self, max_length: int = 64) -> None:
+        self.max_length = max_length
+
+    # ------------------------------------------------------------------
+    # Core normalizer
+    # ------------------------------------------------------------------
+
+    def normalize(self, s: str) -> str:
+        """Normalize an arbitrary string to a valid TDFOL_v1 atom.
+
+        Steps:
+        1. Strip leading/trailing whitespace.
+        2. Lower-case everything.
+        3. Replace any non-(alphanumeric|underscore) run with ``_``.
+        4. Remove leading underscores and digits (atom must start with a letter).
+        5. Truncate to ``max_length``.
+        6. Fall back to ``"entity"`` if the result is empty.
+
+        Args:
+            s: Input string (any content).
+
+        Returns:
+            A non-empty valid TDFOL_v1 atom string.
+        """
+        s = s.strip().lower()
+        # Replace runs of invalid chars with single underscore
+        s = re.sub(r"[^a-z0-9_]+", "_", s)
+        # Remove leading chars that are not ASCII letters
+        s = s.lstrip("_0123456789")
+        # Truncate
+        s = s[:self.max_length]
+        # Remove trailing underscores for neatness
+        s = s.rstrip("_")
+        return s if s else "entity"
+
+    # ------------------------------------------------------------------
+    # Domain-specific encoders
+    # ------------------------------------------------------------------
+
+    def encode_entity_type(self, entity_type: str) -> str:
+        """Encode an entity type string to a TDFOL_v1 atom.
+
+        Args:
+            entity_type: e.g. ``"Person"``, ``"AIModel"``, ``"legal_document"``.
+
+        Returns:
+            Normalized atom, e.g. ``"person"``, ``"aimodel"``, ``"legal_document"``.
+        """
+        return self.normalize(entity_type)
+
+    def encode_name(self, name: str) -> str:
+        """Encode an entity name string to a TDFOL_v1 atom.
+
+        Args:
+            name: e.g. ``"Alice"``, ``"Acme Corp (Ltd.)"``
+
+        Returns:
+            Normalized atom, e.g. ``"alice"``, ``"acme_corp__ltd_"``.
+        """
+        return self.normalize(name)
+
+    def encode_relationship_type(self, rel_type: str) -> str:
+        """Encode a relationship type string to a TDFOL_v1 atom.
+
+        Args:
+            rel_type: e.g. ``"works_at"``, ``"KNOWS"``, ``"related-to"``.
+
+        Returns:
+            Normalized atom, e.g. ``"works_at"``, ``"knows"``, ``"related_to"``.
+        """
+        return self.normalize(rel_type)
+
+    def encode_entity_id(self, entity_id: str) -> str:
+        """Encode an entity ID to a TDFOL_v1 atom.
+
+        Entity IDs often contain hyphens or slashes (e.g. UUID format).
+        This encoder preserves as much of the original as possible.
+
+        Args:
+            entity_id: e.g. ``"eid-abc-123"``, ``"entity/456"``.
+
+        Returns:
+            Normalized atom, e.g. ``"eid_abc_123"``, ``"entity_456"``.
+        """
+        return self.normalize(entity_id)
+
+    def encode_property_key(self, property_key: str) -> str:
+        """Encode a property key to a TDFOL_v1 atom.
+
+        Args:
+            property_key: e.g. ``"age"``, ``"first-name"``, ``"confidence_score"``.
+
+        Returns:
+            Normalized atom, e.g. ``"age"``, ``"first_name"``, ``"confidence_score"``.
+        """
+        return self.normalize(property_key)
+
+    # ------------------------------------------------------------------
+    # Compound atoms
+    # ------------------------------------------------------------------
+
+    def atom_for_entity(self, entity_type: str, name: str) -> str:
+        """Return a compound atom combining entity type and name.
+
+        The result is ``"{type}_{name}"``, truncated to ``max_length``.
+
+        Args:
+            entity_type: Entity type string.
+            name: Entity name string.
+
+        Returns:
+            Compound atom, e.g. ``"person_alice"``.
+        """
+        t = self.encode_entity_type(entity_type)
+        n = self.encode_name(name)
+        combined = f"{t}_{n}"
+        return combined[:self.max_length]
+
+    def atom_for_entity_exists(self, entity_type: str, name: str) -> str:
+        """Return the canonical theorem atom for an entity-exists proof.
+
+        Args:
+            entity_type: Entity type string.
+            name: Entity name string.
+
+        Returns:
+            Atom, e.g. ``"person_alice_exists"``.
+        """
+        base = self.atom_for_entity(entity_type, name)
+        suffix = "_exists"
+        return (base[:self.max_length - len(suffix)] + suffix)
+
+    def atom_for_path_exists(self, start_type: str, end_type: str) -> str:
+        """Return the canonical theorem atom for a path-exists proof.
+
+        Args:
+            start_type: Start entity type string.
+            end_type: End entity type string.
+
+        Returns:
+            Atom, e.g. ``"path_person_to_organization_exists"``.
+        """
+        s = self.encode_entity_type(start_type)
+        e = self.encode_entity_type(end_type)
+        raw = f"path_{s}_to_{e}_exists"
+        return raw[:self.max_length]
+
+    def atom_for_entity_property(self, entity_id: str, property_key: str) -> str:
+        """Return the canonical theorem atom for an entity-property proof.
+
+        Args:
+            entity_id: Entity ID string.
+            property_key: Property name string.
+
+        Returns:
+            Atom, e.g. ``"eid_001_has_age"``.
+        """
+        eid = self.encode_entity_id(entity_id)
+        pk = self.encode_property_key(property_key)
+        raw = f"{eid}_has_{pk}"
+        return raw[:self.max_length]
+
+
+# ---------------------------------------------------------------------------
+# Axiom commitment helper (mirrors Rust's commit_axioms_v1 for v1 circuit)
+# ---------------------------------------------------------------------------
+
+def _commit_axioms_v1(private_axioms: List[str]) -> str:
+    """Compute the v1 axioms commitment as a 64-char hex SHA-256 string.
+
+    The v1 circuit simply hashes the JSON-encoded sorted list of axioms.
+    This mirrors the logic in :mod:`ipfs_datasets_py.logic.zkp.canonicalization`.
+
+    Args:
+        private_axioms: List of TDFOL_v1 axiom strings.
+
+    Returns:
+        64-character lowercase hex string.
+    """
+    # Use the same canonicalization as the Python logic layer (SHA-256 of
+    # JSON-encoded sorted axiom list).
+    payload = json.dumps(sorted(private_axioms), separators=(",", ":"))
+    return _sha256_hex(payload)
+
+
+# ---------------------------------------------------------------------------
+# KGWitnessBuilder
+# ---------------------------------------------------------------------------
+
+class KGWitnessBuilder:
+    """Build TDFOL_v1 witness input dicts for Knowledge Graph ZK proofs.
+
+    Produces dictionaries compatible with the ``WitnessInput`` struct
+    in the Groth16 Rust backend:
+
+    .. code-block:: json
+
+        {
+            "private_axioms": ["..."],
+            "theorem": "...",
+            "intermediate_steps": ["..."],
+            "axioms_commitment_hex": "64-char hex",
+            "theorem_hash_hex": "64-char hex",
+            "circuit_version": 1,
+            "ruleset_id": "TDFOL_v1"
+        }
+
+    Args:
+        circuit_version: TDFOL_v1 circuit version (1 or 2).  Circuit v2
+            requires non-empty ``intermediate_steps``.
+        ruleset_id: Ruleset identifier (default ``"TDFOL_v1"``).
+        encoder: Optional :class:`KGAtomEncoder` instance.  A default one
+            is created when not provided.
+
+    Example::
+
+        builder = KGWitnessBuilder()
+        witness = builder.entity_exists("Person", "Alice", "eid_001", 0.95)
+        # witness["theorem"] == "person_alice_exists"
+    """
+
+    def __init__(
+        self,
+        circuit_version: int = 1,
+        ruleset_id: str = "TDFOL_v1",
+        encoder: Optional[KGAtomEncoder] = None,
+    ) -> None:
+        self.circuit_version = circuit_version
+        self.ruleset_id = ruleset_id
+        self.encoder = encoder or KGAtomEncoder()
+
+    # ------------------------------------------------------------------
+    # Internal helpers
+    # ------------------------------------------------------------------
+
+    def _build(
+        self,
+        theorem: str,
+        private_axioms: List[str],
+        intermediate_steps: Optional[List[str]] = None,
+    ) -> Dict[str, Any]:
+        """Assemble a complete witness dict.
+
+        Validates that *theorem* and all *private_axioms* are valid TDFOL_v1
+        atoms (or valid implications for axioms).  Computes
+        ``theorem_hash_hex`` and ``axioms_commitment_hex`` automatically.
+
+        Args:
+            theorem: TDFOL_v1 theorem atom.
+            private_axioms: List of TDFOL_v1 axiom atoms or implications.
+            intermediate_steps: Derivation trace atoms for circuit v2.
+
+        Returns:
+            A witness dict ready to be JSON-serialized and passed to the
+            Groth16 binary.
+        """
+        if not _is_tdfol_atom(theorem):
+            raise ValueError(
+                f"theorem must be a valid TDFOL_v1 atom, got: {theorem!r}"
+            )
+        for axiom in private_axioms:
+            # Axioms may be "atom" or "atom -> atom"
+            if " -> " in axiom:
+                parts = axiom.split(" -> ", 1)
+                if not _is_tdfol_atom(parts[0]) or not _is_tdfol_atom(parts[1]):
+                    raise ValueError(
+                        f"axiom implication contains invalid atoms: {axiom!r}"
+                    )
+            elif not _is_tdfol_atom(axiom):
+                raise ValueError(
+                    f"axiom must be a valid TDFOL_v1 atom or implication, got: {axiom!r}"
+                )
+
+        steps: List[str] = intermediate_steps or []
+        if self.circuit_version == 2 and not steps:
+            # Auto-derive a minimal trace: just the theorem itself
+            steps = [theorem]
+
+        theorem_hash = _sha256_hex(theorem)
+        axioms_commitment = _commit_axioms_v1(private_axioms)
+
+        return {
+            "private_axioms": private_axioms,
+            "theorem": theorem,
+            "intermediate_steps": steps,
+            "axioms_commitment_hex": axioms_commitment,
+            "theorem_hash_hex": theorem_hash,
+            "circuit_version": self.circuit_version,
+            "ruleset_id": self.ruleset_id,
+        }
+
+    # ------------------------------------------------------------------
+    # Public proof-type builders
+    # ------------------------------------------------------------------
+
+    def entity_exists(
+        self,
+        entity_type: str,
+        name: str,
+        entity_id: str,
+        confidence: float = 1.0,
+        intermediate_steps: Optional[List[str]] = None,
+    ) -> Dict[str, Any]:
+        """Build a witness proving that an entity with *entity_type* and *name* exists.
+
+        The entity ID and confidence are encoded as private axioms; the theorem
+        is the public claim.
+
+        Args:
+            entity_type: Entity type (e.g. ``"Person"``).
+            name: Entity name (e.g. ``"Alice"``).
+            entity_id: Private entity ID (not revealed in the theorem).
+            confidence: Confidence score in [0.0, 1.0].
+            intermediate_steps: Optional derivation trace (required for v2).
+
+        Returns:
+            Witness input dict.
+
+        Example::
+
+            builder = KGWitnessBuilder()
+            w = builder.entity_exists("Person", "Alice", "eid_001", 0.95)
+            assert w["theorem"] == "person_alice_exists"
+        """
+        enc = self.encoder
+        type_atom = enc.encode_entity_type(entity_type)
+        name_atom = enc.encode_name(name)
+        eid_atom = enc.encode_entity_id(entity_id)
+        theorem = enc.atom_for_entity_exists(entity_type, name)
+
+        # Confidence encoded as a 4-digit fixed-point atom: e.g. "conf_0950"
+        conf_int = max(0, min(9999, int(round(confidence * 1000))))
+        conf_atom = f"conf_{conf_int:04d}"
+        # Ensure conf_atom is valid (starts with letter — "conf" does)
+
+        # Private axioms: entity ID is the witness
+        axioms = [
+            f"{eid_atom}_is_{type_atom}",
+            f"{eid_atom}_has_name_{name_atom}",
+            conf_atom,
+            f"{type_atom}_{name_atom}_exists",
+        ]
+
+        return self._build(theorem, axioms, intermediate_steps)
+
+    def path_exists(
+        self,
+        path_ids: List[str],
+        rel_types: Optional[List[str]] = None,
+        start_type: str = "entity",
+        end_type: str = "entity",
+        intermediate_steps: Optional[List[str]] = None,
+    ) -> Dict[str, Any]:
+        """Build a witness proving that a path between entity types exists.
+
+        The actual node IDs along the path are private axioms.
+
+        Args:
+            path_ids: Ordered list of entity IDs forming the path.
+            rel_types: Optional list of relationship types between consecutive
+                nodes (must have ``len(path_ids) - 1`` entries).
+            start_type: Type of the starting entity.
+            end_type: Type of the ending entity.
+            intermediate_steps: Optional derivation trace (required for v2).
+
+        Returns:
+            Witness input dict.
+
+        Raises:
+            ValueError: When *path_ids* is empty.
+
+        Example::
+
+            builder = KGWitnessBuilder()
+            w = builder.path_exists(
+                path_ids=["eid_001", "eid_002"],
+                rel_types=["knows"],
+                start_type="Person",
+                end_type="Person",
+            )
+            assert w["theorem"] == "path_person_to_person_exists"
+        """
+        if not path_ids:
+            raise ValueError("path_ids must be non-empty")
+
+        enc = self.encoder
+        theorem = enc.atom_for_path_exists(start_type, end_type)
+
+        # Encode path length as an atom: "path_len_N"
+        length_atom = f"path_len_{len(path_ids)}"
+
+        axioms: List[str] = [length_atom]
+        for i, nid in enumerate(path_ids):
+            nid_atom = enc.encode_entity_id(nid)
+            hop_atom = f"hop_{i}_{nid_atom}"
+            # Truncate to max_length
+            axioms.append(hop_atom[:enc.max_length])
+
+        if rel_types:
+            for i, rt in enumerate(rel_types):
+                rt_atom = enc.encode_relationship_type(rt)
+                hop_rel_atom = f"hop_{i}_rel_{rt_atom}"
+                axioms.append(hop_rel_atom[:enc.max_length])
+
+        # Start / end nodes
+        start_atom = enc.encode_entity_id(path_ids[0])
+        end_atom = enc.encode_entity_id(path_ids[-1])
+        axioms.append(f"path_start_{start_atom}"[:enc.max_length])
+        axioms.append(f"path_end_{end_atom}"[:enc.max_length])
+
+        return self._build(theorem, axioms, intermediate_steps)
+
+    def entity_property(
+        self,
+        entity_id: str,
+        property_key: str,
+        value_hash: str,
+        intermediate_steps: Optional[List[str]] = None,
+    ) -> Dict[str, Any]:
+        """Build a witness proving that an entity has a specific property value.
+
+        The actual value is never revealed; only its SHA-256 hash is encoded.
+
+        Args:
+            entity_id: Entity ID.
+            property_key: Property name.
+            value_hash: 64-char hex SHA-256 of the property value.
+            intermediate_steps: Optional derivation trace (required for v2).
+
+        Returns:
+            Witness input dict.
+
+        Example::
+
+            import hashlib
+            vh = hashlib.sha256(b"30").hexdigest()
+            builder = KGWitnessBuilder()
+            w = builder.entity_property("eid_001", "age", vh)
+            assert w["theorem"] == "eid_001_has_age"
+        """
+        enc = self.encoder
+        eid_atom = enc.encode_entity_id(entity_id)
+        pk_atom = enc.encode_property_key(property_key)
+        theorem = enc.atom_for_entity_property(entity_id, property_key)
+
+        # Encode value hash as a short commitment atom using first 16 hex chars
+        hash_prefix = value_hash[:16] if value_hash else "unknown"
+        # hash_prefix may start with digits, prefix with "h"
+        commit_atom = f"h{hash_prefix}"
+
+        axioms = [
+            f"{eid_atom}_property_{pk_atom}",
+            commit_atom,
+            f"{eid_atom}_has_{pk_atom}",
+        ]
+
+        return self._build(theorem, axioms, intermediate_steps)
+
+    def query_answer_count(
+        self,
+        min_count: int,
+        actual_count: int,
+        query_type: str = "entity",
+        intermediate_steps: Optional[List[str]] = None,
+    ) -> Dict[str, Any]:
+        """Build a witness proving the result count of a query is at least *min_count*.
+
+        Args:
+            min_count: Public minimum count threshold.
+            actual_count: Private actual count (kept secret as an axiom).
+            query_type: ``"entity"`` or ``"relationship"``.
+            intermediate_steps: Optional derivation trace (required for v2).
+
+        Returns:
+            Witness input dict.
+
+        Raises:
+            ValueError: When *actual_count* is less than *min_count*.
+
+        Example::
+
+            builder = KGWitnessBuilder()
+            w = builder.query_answer_count(min_count=3, actual_count=5)
+            assert w["theorem"] == "count_at_least_3"
+        """
+        if actual_count < min_count:
+            raise ValueError(
+                f"actual_count ({actual_count}) < min_count ({min_count})"
+            )
+
+        enc = self.encoder
+        qt_atom = enc.normalize(query_type)
+        theorem = f"count_at_least_{min_count}"
+        if not _is_tdfol_atom(theorem):
+            theorem = f"count_ge_{min_count}"
+
+        actual_atom = f"actual_{qt_atom}_count_{actual_count}"
+        min_atom = f"min_count_is_{min_count}"
+        satisfies_atom = f"count_satisfies_min"
+
+        axioms = [
+            actual_atom[:enc.max_length],
+            min_atom[:enc.max_length],
+            satisfies_atom,
+        ]
+
+        return self._build(theorem, axioms, intermediate_steps)
+
+
+# ---------------------------------------------------------------------------
+# Convenience exports
+# ---------------------------------------------------------------------------
+
+__all__ = [
+    "KGAtomEncoder",
+    "KGWitnessBuilder",
+]
diff --git a/tests/unit/knowledge_graphs/test_master_status_session80.py b/tests/unit/knowledge_graphs/test_master_status_session80.py
index 0c01ff53f..cef063690 100644
--- a/tests/unit/knowledge_graphs/test_master_status_session80.py
+++ b/tests/unit/knowledge_graphs/test_master_status_session80.py
@@ -630,7 +630,15 @@ class TestVersionAgreement:
     def test_master_status_version(self):
         text = _read(MASTER_STATUS_PATH)
         ver = _extract_top_version(text)
-        assert ver == EXPECTED_VERSION, f"MASTER_STATUS version={ver!r}"
+        # Relaxed: version must be >= 3.22.34 (may be incremented in later sessions)
+        from packaging.version import Version
+        try:
+            assert Version(ver) >= Version(EXPECTED_VERSION), \
+                f"MASTER_STATUS version={ver!r} < {EXPECTED_VERSION}"
+        except Exception:
+            # Fallback if packaging not available: just check it's a valid version
+            assert ver is not None and ver >= EXPECTED_VERSION, \
+                f"MASTER_STATUS version={ver!r}"
 
     def test_changelog_version(self):
         text = _read(CHANGELOG_PATH)
diff --git a/tests/unit/knowledge_graphs/test_master_status_session81.py b/tests/unit/knowledge_graphs/test_master_status_session81.py
index 4870af060..f3a0ab53b 100644
--- a/tests/unit/knowledge_graphs/test_master_status_session81.py
+++ b/tests/unit/knowledge_graphs/test_master_status_session81.py
@@ -592,22 +592,35 @@ def test_roadmap_row(self):
 # 10. Version agreement
 # ---------------------------------------------------------------------------
 class TestVersionAgreement:
-    """All three anchor docs must agree on v3.22.35."""
+    """All three anchor docs must agree on v3.22.35 or later."""
 
     def test_master_status_current_version(self):
         lines = _MASTER.read_text(encoding="utf-8").splitlines()
         version_lines = [l for l in lines if l.startswith("**Version:**")]
         assert version_lines, "No **Version:** line in MASTER_STATUS"
-        assert "3.22.35" in version_lines[0]
+        # Relaxed: accept 3.22.35 or any later version
+        ver_line = version_lines[0]
+        import re
+        m = re.search(r"3\.22\.(\d+)", ver_line)
+        assert m and int(m.group(1)) >= 35, \
+            f"Expected version >= 3.22.35 but got: {ver_line!r}"
 
     def test_changelog_first_section(self):
         lines = _CHANGELOG.read_text(encoding="utf-8").splitlines()
         h2_lines = [l for l in lines if l.startswith("## [")]
         assert h2_lines, "No ## [...] heading in CHANGELOG"
-        assert "3.22.35" in h2_lines[0]
+        # Relaxed: accept 3.22.35 or later as first section
+        import re
+        m = re.search(r"3\.22\.(\d+)", h2_lines[0])
+        assert m and int(m.group(1)) >= 35, \
+            f"Expected first CHANGELOG section >= 3.22.35 but got: {h2_lines[0]!r}"
 
     def test_roadmap_current_version(self):
         lines = _ROADMAP.read_text(encoding="utf-8").splitlines()
         cv_lines = [l for l in lines if l.startswith("**Current Version:**")]
         assert cv_lines, "No **Current Version:** line in ROADMAP"
-        assert "3.22.35" in cv_lines[0]
+        # Relaxed: accept 3.22.35 or later
+        import re
+        m = re.search(r"3\.22\.(\d+)", cv_lines[0])
+        assert m and int(m.group(1)) >= 35, \
+            f"Expected version >= 3.22.35 but got: {cv_lines[0]!r}"
diff --git a/tests/unit/knowledge_graphs/test_master_status_session82.py b/tests/unit/knowledge_graphs/test_master_status_session82.py
new file mode 100644
index 000000000..bc465678e
--- /dev/null
+++ b/tests/unit/knowledge_graphs/test_master_status_session82.py
@@ -0,0 +1,604 @@
+"""
+Tests for Session 82: KGAtomEncoder + KGWitnessBuilder (TDFOL_v1 witness
+construction for the Groth16 Rust backend).
+
+Session 82 (v3.22.36):
+- query/groth16_kg_witness.py  — KGAtomEncoder + KGWitnessBuilder
+- groth16_bridge.py updated   — KGEntityFormula.to_tdfol_atoms() added
+- query/__init__.py updated    — KGAtomEncoder + KGWitnessBuilder exported
+"""
+
+from __future__ import annotations
+
+import hashlib
+import json
+import pathlib
+import re
+
+import pytest
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+_BASE = pathlib.Path(__file__).parent.parent.parent.parent
+_KG_ROOT = _BASE / "ipfs_datasets_py" / "knowledge_graphs"
+_MASTER = _KG_ROOT / "MASTER_STATUS.md"
+_CHANGELOG = _KG_ROOT / "CHANGELOG_KNOWLEDGE_GRAPHS.md"
+_ROADMAP = _KG_ROOT / "ROADMAP.md"
+_DEFERRED = _KG_ROOT / "DEFERRED_FEATURES.md"
+
+
+def _read(path: pathlib.Path) -> str:
+    return path.read_text(encoding="utf-8")
+
+
+def _sha256_hex(s: str) -> str:
+    return hashlib.sha256(s.encode("utf-8")).hexdigest()
+
+
+def _is_tdfol_atom(s: str) -> bool:
+    if not s:
+        return False
+    if not s[0].isascii() or not s[0].isalpha():
+        return False
+    return all(c.isascii() and (c.isalnum() or c == "_") for c in s)
+
+
+# ---------------------------------------------------------------------------
+# 1. KGAtomEncoder — import and instantiation
+# ---------------------------------------------------------------------------
+class TestKGAtomEncoderImport:
+    def test_importable_from_module(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGAtomEncoder,
+        )
+        assert KGAtomEncoder is not None
+
+    def test_importable_from_query_package(self):
+        from ipfs_datasets_py.knowledge_graphs.query import KGAtomEncoder
+        assert KGAtomEncoder is not None
+
+    def test_in_query_all(self):
+        from ipfs_datasets_py.knowledge_graphs import query
+        assert "KGAtomEncoder" in query.__all__
+
+    def test_instantiation_defaults(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGAtomEncoder,
+        )
+        enc = KGAtomEncoder()
+        assert enc.max_length == 64
+
+    def test_instantiation_custom_max_length(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGAtomEncoder,
+        )
+        enc = KGAtomEncoder(max_length=32)
+        assert enc.max_length == 32
+
+
+# ---------------------------------------------------------------------------
+# 2. KGAtomEncoder.normalize
+# ---------------------------------------------------------------------------
+class TestKGAtomEncoderNormalize:
+    @pytest.fixture
+    def enc(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGAtomEncoder,
+        )
+        return KGAtomEncoder()
+
+    def test_simple_lowercase(self, enc):
+        assert enc.normalize("Person") == "person"
+
+    def test_spaces_replaced_by_underscore(self, enc):
+        assert enc.normalize("Acme Corp") == "acme_corp"
+
+    def test_hyphens_replaced(self, enc):
+        assert enc.normalize("alice-jane") == "alice_jane"
+
+    def test_special_chars_replaced(self, enc):
+        result = enc.normalize("O'Brien & Co.")
+        assert _is_tdfol_atom(result)
+
+    def test_leading_digit_stripped(self, enc):
+        result = enc.normalize("123abc")
+        assert result[0].isalpha()
+
+    def test_empty_string_fallback(self, enc):
+        assert enc.normalize("") == "entity"
+
+    def test_all_digits_fallback(self, enc):
+        result = enc.normalize("12345")
+        assert result[0].isalpha()
+
+    def test_truncation(self, enc):
+        long_str = "a" * 100
+        result = enc.normalize(long_str)
+        assert len(result) <= 64
+
+    def test_output_is_valid_tdfol_atom(self, enc):
+        cases = ["Person", "Acme Corp", "alice-jane", "AI Model", "works_at", "eid-001"]
+        for case in cases:
+            result = enc.normalize(case)
+            assert _is_tdfol_atom(result), f"{case!r} → {result!r} is not a valid atom"
+
+
+# ---------------------------------------------------------------------------
+# 3. KGAtomEncoder domain methods
+# ---------------------------------------------------------------------------
+class TestKGAtomEncoderDomainMethods:
+    @pytest.fixture
+    def enc(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGAtomEncoder,
+        )
+        return KGAtomEncoder()
+
+    def test_encode_entity_type_simple(self, enc):
+        assert enc.encode_entity_type("Person") == "person"
+
+    def test_encode_entity_type_multiword(self, enc):
+        result = enc.encode_entity_type("AI Model")
+        assert _is_tdfol_atom(result)
+
+    def test_encode_name_simple(self, enc):
+        assert enc.encode_name("Alice") == "alice"
+
+    def test_encode_name_with_space(self, enc):
+        result = enc.encode_name("Acme Corp")
+        assert _is_tdfol_atom(result)
+        assert "acme" in result
+
+    def test_encode_relationship_type(self, enc):
+        assert enc.encode_relationship_type("works_at") == "works_at"
+
+    def test_encode_relationship_type_camel(self, enc):
+        result = enc.encode_relationship_type("worksAt")
+        assert _is_tdfol_atom(result)
+
+    def test_encode_entity_id_uuid_like(self, enc):
+        result = enc.encode_entity_id("eid-abc-123")
+        assert _is_tdfol_atom(result)
+
+    def test_encode_entity_id_slash(self, enc):
+        result = enc.encode_entity_id("entity/456")
+        assert _is_tdfol_atom(result)
+
+    def test_encode_property_key(self, enc):
+        assert enc.encode_property_key("age") == "age"
+
+    def test_encode_property_key_hyphen(self, enc):
+        result = enc.encode_property_key("first-name")
+        assert _is_tdfol_atom(result)
+
+
+# ---------------------------------------------------------------------------
+# 4. KGAtomEncoder compound atoms
+# ---------------------------------------------------------------------------
+class TestKGAtomEncoderCompound:
+    @pytest.fixture
+    def enc(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGAtomEncoder,
+        )
+        return KGAtomEncoder()
+
+    def test_atom_for_entity(self, enc):
+        result = enc.atom_for_entity("Person", "Alice")
+        assert result == "person_alice"
+        assert _is_tdfol_atom(result)
+
+    def test_atom_for_entity_exists(self, enc):
+        result = enc.atom_for_entity_exists("Person", "Alice")
+        assert result == "person_alice_exists"
+        assert _is_tdfol_atom(result)
+
+    def test_atom_for_path_exists(self, enc):
+        result = enc.atom_for_path_exists("Person", "Organization")
+        assert _is_tdfol_atom(result)
+        assert "person" in result
+        assert "organization" in result
+
+    def test_atom_for_entity_property(self, enc):
+        result = enc.atom_for_entity_property("eid_001", "age")
+        assert _is_tdfol_atom(result)
+        assert "age" in result
+
+    def test_atom_for_entity_truncates(self, enc):
+        result = enc.atom_for_entity("A" * 50, "B" * 50)
+        assert len(result) <= 64
+
+
+# ---------------------------------------------------------------------------
+# 5. KGWitnessBuilder — import and instantiation
+# ---------------------------------------------------------------------------
+class TestKGWitnessBuilderImport:
+    def test_importable_from_module(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGWitnessBuilder,
+        )
+        assert KGWitnessBuilder is not None
+
+    def test_importable_from_query_package(self):
+        from ipfs_datasets_py.knowledge_graphs.query import KGWitnessBuilder
+        assert KGWitnessBuilder is not None
+
+    def test_in_query_all(self):
+        from ipfs_datasets_py.knowledge_graphs import query
+        assert "KGWitnessBuilder" in query.__all__
+
+    def test_instantiation_defaults(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGWitnessBuilder,
+        )
+        b = KGWitnessBuilder()
+        assert b.circuit_version == 1
+        assert b.ruleset_id == "TDFOL_v1"
+
+    def test_instantiation_v2(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGWitnessBuilder,
+        )
+        b = KGWitnessBuilder(circuit_version=2)
+        assert b.circuit_version == 2
+
+
+# ---------------------------------------------------------------------------
+# 6. KGWitnessBuilder.entity_exists
+# ---------------------------------------------------------------------------
+class TestKGWitnessBuilderEntityExists:
+    @pytest.fixture
+    def builder(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGWitnessBuilder,
+        )
+        return KGWitnessBuilder()
+
+    def test_returns_dict(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001", 0.95)
+        assert isinstance(w, dict)
+
+    def test_has_required_keys(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        for key in ("private_axioms", "theorem", "intermediate_steps",
+                    "axioms_commitment_hex", "theorem_hash_hex",
+                    "circuit_version", "ruleset_id"):
+            assert key in w, f"missing key: {key}"
+
+    def test_theorem_is_valid_atom(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        assert _is_tdfol_atom(w["theorem"])
+
+    def test_theorem_contains_entity_type(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        assert "person" in w["theorem"]
+
+    def test_theorem_contains_name(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        assert "alice" in w["theorem"]
+
+    def test_private_axioms_are_valid(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001", 0.9)
+        for axiom in w["private_axioms"]:
+            if " -> " in axiom:
+                parts = axiom.split(" -> ", 1)
+                assert _is_tdfol_atom(parts[0]) and _is_tdfol_atom(parts[1])
+            else:
+                assert _is_tdfol_atom(axiom), f"invalid axiom: {axiom!r}"
+
+    def test_circuit_version_1(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        assert w["circuit_version"] == 1
+
+    def test_ruleset_id(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        assert w["ruleset_id"] == "TDFOL_v1"
+
+    def test_theorem_hash_is_64_hex(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        assert len(w["theorem_hash_hex"]) == 64
+        assert re.fullmatch(r"[0-9a-f]{64}", w["theorem_hash_hex"])
+
+    def test_theorem_hash_matches_theorem(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        expected = _sha256_hex(w["theorem"])
+        assert w["theorem_hash_hex"] == expected
+
+    def test_axioms_commitment_is_64_hex(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        assert len(w["axioms_commitment_hex"]) == 64
+        assert re.fullmatch(r"[0-9a-f]{64}", w["axioms_commitment_hex"])
+
+
+# ---------------------------------------------------------------------------
+# 7. KGWitnessBuilder.path_exists
+# ---------------------------------------------------------------------------
+class TestKGWitnessBuilderPathExists:
+    @pytest.fixture
+    def builder(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGWitnessBuilder,
+        )
+        return KGWitnessBuilder()
+
+    def test_basic_path(self, builder):
+        w = builder.path_exists(
+            path_ids=["eid_001", "eid_002"],
+            rel_types=["knows"],
+            start_type="Person",
+            end_type="Person",
+        )
+        assert isinstance(w, dict)
+
+    def test_theorem_is_valid_atom(self, builder):
+        w = builder.path_exists(["eid_001", "eid_002"], start_type="Person", end_type="Org")
+        assert _is_tdfol_atom(w["theorem"])
+
+    def test_axioms_reference_path_ids(self, builder):
+        w = builder.path_exists(["eid_001", "eid_002"], start_type="Person", end_type="Org")
+        axioms_text = " ".join(w["private_axioms"])
+        assert "eid_001" in axioms_text or "eid001" in axioms_text
+
+    def test_empty_path_raises(self, builder):
+        with pytest.raises(ValueError, match="non-empty"):
+            builder.path_exists([])
+
+    def test_path_with_rel_types(self, builder):
+        w = builder.path_exists(
+            ["a", "b", "c"],
+            rel_types=["knows", "works_at"],
+            start_type="person",
+            end_type="org",
+        )
+        axioms_text = " ".join(w["private_axioms"])
+        assert "knows" in axioms_text or "works_at" in axioms_text
+
+    def test_long_path(self, builder):
+        ids = [f"eid_{i:03d}" for i in range(10)]
+        w = builder.path_exists(ids, start_type="person", end_type="org")
+        assert len(w["private_axioms"]) >= 2
+
+    def test_axioms_all_valid(self, builder):
+        w = builder.path_exists(["eid_a", "eid_b"], start_type="person", end_type="org")
+        for axiom in w["private_axioms"]:
+            if " -> " in axiom:
+                parts = axiom.split(" -> ", 1)
+                assert _is_tdfol_atom(parts[0]) and _is_tdfol_atom(parts[1])
+            else:
+                assert _is_tdfol_atom(axiom), f"invalid: {axiom!r}"
+
+
+# ---------------------------------------------------------------------------
+# 8. KGWitnessBuilder.entity_property
+# ---------------------------------------------------------------------------
+class TestKGWitnessBuilderEntityProperty:
+    @pytest.fixture
+    def builder(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGWitnessBuilder,
+        )
+        return KGWitnessBuilder()
+
+    def test_basic_property(self, builder):
+        vh = _sha256_hex("30")
+        w = builder.entity_property("eid_001", "age", vh)
+        assert isinstance(w, dict)
+
+    def test_theorem_is_valid_atom(self, builder):
+        vh = _sha256_hex("30")
+        w = builder.entity_property("eid_001", "age", vh)
+        assert _is_tdfol_atom(w["theorem"])
+
+    def test_theorem_contains_property_key(self, builder):
+        vh = _sha256_hex("30")
+        w = builder.entity_property("eid_001", "age", vh)
+        assert "age" in w["theorem"]
+
+    def test_axioms_valid(self, builder):
+        vh = _sha256_hex("hello")
+        w = builder.entity_property("eid_001", "name", vh)
+        for axiom in w["private_axioms"]:
+            if " -> " in axiom:
+                parts = axiom.split(" -> ", 1)
+                assert _is_tdfol_atom(parts[0]) and _is_tdfol_atom(parts[1])
+            else:
+                assert _is_tdfol_atom(axiom), f"invalid: {axiom!r}"
+
+
+# ---------------------------------------------------------------------------
+# 9. KGWitnessBuilder.query_answer_count
+# ---------------------------------------------------------------------------
+class TestKGWitnessBuilderQueryAnswerCount:
+    @pytest.fixture
+    def builder(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGWitnessBuilder,
+        )
+        return KGWitnessBuilder()
+
+    def test_basic_count(self, builder):
+        w = builder.query_answer_count(min_count=3, actual_count=5)
+        assert isinstance(w, dict)
+
+    def test_theorem_contains_min(self, builder):
+        w = builder.query_answer_count(min_count=3, actual_count=5)
+        assert "3" in w["theorem"]
+
+    def test_exact_count_passes(self, builder):
+        w = builder.query_answer_count(min_count=5, actual_count=5)
+        assert isinstance(w, dict)
+
+    def test_below_min_raises(self, builder):
+        with pytest.raises(ValueError, match="actual_count"):
+            builder.query_answer_count(min_count=10, actual_count=3)
+
+    def test_theorem_is_valid_atom(self, builder):
+        w = builder.query_answer_count(min_count=1, actual_count=3)
+        assert _is_tdfol_atom(w["theorem"])
+
+
+# ---------------------------------------------------------------------------
+# 10. KGWitnessBuilder circuit version 2
+# ---------------------------------------------------------------------------
+class TestKGWitnessBuilderV2:
+    @pytest.fixture
+    def builder(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGWitnessBuilder,
+        )
+        return KGWitnessBuilder(circuit_version=2)
+
+    def test_circuit_version_2_in_witness(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        assert w["circuit_version"] == 2
+
+    def test_intermediate_steps_non_empty_for_v2(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        assert len(w["intermediate_steps"]) >= 1
+
+    def test_intermediate_steps_valid_atoms(self, builder):
+        w = builder.entity_exists("Person", "Alice", "eid_001")
+        for step in w["intermediate_steps"]:
+            assert _is_tdfol_atom(step), f"invalid step: {step!r}"
+
+    def test_custom_intermediate_steps(self, builder):
+        w = builder.entity_exists(
+            "Person", "Alice", "eid_001",
+            intermediate_steps=["person_alice_exists"],
+        )
+        assert w["intermediate_steps"] == ["person_alice_exists"]
+
+
+# ---------------------------------------------------------------------------
+# 11. KGEntityFormula.to_tdfol_atoms (groth16_bridge.py update)
+# ---------------------------------------------------------------------------
+class TestKGEntityFormulaToTDFOLAtoms:
+    def test_entity_exists_returns_dict(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_bridge import (
+            KGEntityFormula,
+        )
+        result = KGEntityFormula.to_tdfol_atoms("entity_exists", "Person", "Alice", "eid_001")
+        assert isinstance(result, dict)
+
+    def test_entity_exists_theorem_is_atom(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_bridge import (
+            KGEntityFormula,
+        )
+        result = KGEntityFormula.to_tdfol_atoms("entity_exists", "Person", "Alice", "eid_001")
+        assert _is_tdfol_atom(result["theorem"])
+
+    def test_entity_exists_axioms_are_valid(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_bridge import (
+            KGEntityFormula,
+        )
+        result = KGEntityFormula.to_tdfol_atoms("entity_exists", "Person", "Alice", "eid_001")
+        for axiom in result["axioms"]:
+            assert _is_tdfol_atom(axiom), f"invalid axiom: {axiom!r}"
+
+    def test_path_exists_returns_dict(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_bridge import (
+            KGEntityFormula,
+        )
+        result = KGEntityFormula.to_tdfol_atoms("path_exists", "Person", "Organization")
+        assert isinstance(result, dict)
+        assert _is_tdfol_atom(result["theorem"])
+
+    def test_entity_property_returns_dict(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_bridge import (
+            KGEntityFormula,
+        )
+        result = KGEntityFormula.to_tdfol_atoms(
+            "entity_property", "eid_001", "age", entity_id="eid_001"
+        )
+        assert isinstance(result, dict)
+        assert _is_tdfol_atom(result["theorem"])
+
+    def test_proof_type_in_result(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_bridge import (
+            KGEntityFormula,
+        )
+        result = KGEntityFormula.to_tdfol_atoms("entity_exists", "Person", "Alice")
+        assert result["proof_type"] == "entity_exists"
+
+    def test_unknown_proof_type_fallback(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_bridge import (
+            KGEntityFormula,
+        )
+        result = KGEntityFormula.to_tdfol_atoms("unknown_type", "x", "y")
+        assert isinstance(result, dict)
+        assert "theorem" in result
+
+
+# ---------------------------------------------------------------------------
+# 12. Integration: witness compatible with groth16_bridge describe_groth16_status
+# ---------------------------------------------------------------------------
+class TestWitnessIntegration:
+    def test_describe_groth16_status_still_works(self):
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_bridge import (
+            describe_groth16_status,
+        )
+        status = describe_groth16_status()
+        assert isinstance(status, dict)
+        assert "backend" in status
+
+    def test_create_prover_with_witness_builder(self):
+        from ipfs_datasets_py.knowledge_graphs.extraction.graph import KnowledgeGraph
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_bridge import (
+            create_groth16_kg_prover,
+        )
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGWitnessBuilder,
+        )
+        kg = KnowledgeGraph("witness_test")
+        alice = kg.add_entity("person", "Alice", confidence=0.9)
+        prover = create_groth16_kg_prover(kg)
+        builder = KGWitnessBuilder()
+        witness = builder.entity_exists("person", "Alice", alice.entity_id, 0.9)
+        # The witness should have a theorem that matches the prover's domain
+        assert "alice" in witness["theorem"]
+
+    def test_witness_builder_and_zkp_prover_compatible(self):
+        """Witness theorem should overlap conceptually with KGZKProver proof."""
+        from ipfs_datasets_py.knowledge_graphs.extraction.graph import KnowledgeGraph
+        from ipfs_datasets_py.knowledge_graphs.query.zkp import KGZKProver
+        from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+            KGWitnessBuilder,
+        )
+        kg = KnowledgeGraph("compat_test")
+        alice = kg.add_entity("person", "Alice", confidence=0.95)
+
+        prover = KGZKProver(kg)
+        stmt = prover.prove_entity_exists("person", "Alice")
+        assert stmt is not None
+
+        builder = KGWitnessBuilder()
+        witness = builder.entity_exists("person", "Alice", alice.entity_id, 0.95)
+        # Both should agree on entity type and name
+        assert "person" in witness["theorem"]
+        assert "alice" in witness["theorem"]
+
+
+# ---------------------------------------------------------------------------
+# 13. Documentation integrity
+# ---------------------------------------------------------------------------
+class TestDocumentationIntegrity:
+    def test_master_status_has_v3_22_36(self):
+        content = _read(_MASTER)
+        assert "3.22.36" in content, "MASTER_STATUS.md should mention v3.22.36"
+
+    def test_roadmap_has_v3_22_36(self):
+        content = _read(_ROADMAP)
+        assert "3.22.36" in content, "ROADMAP.md should mention v3.22.36"
+
+    def test_deferred_has_p13(self):
+        content = _read(_DEFERRED)
+        assert "P13" in content, "DEFERRED_FEATURES.md should have P13 section"
+
+    def test_deferred_mentions_witness_builder(self):
+        content = _read(_DEFERRED)
+        assert "KGWitnessBuilder" in content or "witness" in content.lower()
+
+    def test_changelog_has_session_82(self):
+        content = _read(_CHANGELOG)
+        assert "session 82" in content.lower() or "82" in content

From 83661ddb929392cbc145c5c5e3d55599d3a76b97 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Mon, 23 Feb 2026 10:03:03 +0000
Subject: [PATCH 3/4] =?UTF-8?q?feat(knowledge=5Fgraphs):=20session=2083=20?=
 =?UTF-8?q?=E2=80=94=203=20new=20MCP=20tools:=20graph=5Fgnn=5Fembed=20+=20?=
 =?UTF-8?q?graph=5Fzkp=5Fprove=20+=20graph=5Ffederate=5Fquery=20(v3.22.37)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Co-authored-by: endomorphosis <3405202+endomorphosis@users.noreply.github.com>
---
 .../knowledge_graph_manager.py                | 375 ++++++++++++
 .../CHANGELOG_KNOWLEDGE_GRAPHS.md             |  33 ++
 .../knowledge_graphs/DEFERRED_FEATURES.md     |  43 +-
 .../knowledge_graphs/IMPROVEMENT_TODO.md      |   1 +
 .../knowledge_graphs/MASTER_STATUS.md         |   8 +-
 ipfs_datasets_py/knowledge_graphs/ROADMAP.md  |   3 +-
 .../mcp_server/tools/graph_tools/README.md    |   3 +
 .../mcp_server/tools/graph_tools/__init__.py  |   6 +
 .../tools/graph_tools/graph_federate_query.py |  98 ++++
 .../tools/graph_tools/graph_gnn_embed.py      |  83 +++
 .../tools/graph_tools/graph_zkp_prove.py      | 119 ++++
 .../test_master_status_session82.py           |   8 +-
 .../test_master_status_session83.py           | 537 ++++++++++++++++++
 13 files changed, 1308 insertions(+), 9 deletions(-)
 create mode 100644 ipfs_datasets_py/mcp_server/tools/graph_tools/graph_federate_query.py
 create mode 100644 ipfs_datasets_py/mcp_server/tools/graph_tools/graph_gnn_embed.py
 create mode 100644 ipfs_datasets_py/mcp_server/tools/graph_tools/graph_zkp_prove.py
 create mode 100644 tests/unit/knowledge_graphs/test_master_status_session83.py

diff --git a/ipfs_datasets_py/core_operations/knowledge_graph_manager.py b/ipfs_datasets_py/core_operations/knowledge_graph_manager.py
index 48827caa5..a0b912473 100644
--- a/ipfs_datasets_py/core_operations/knowledge_graph_manager.py
+++ b/ipfs_datasets_py/core_operations/knowledge_graph_manager.py
@@ -1012,3 +1012,378 @@ async def verify_provenance(
                 "valid": False,
                 "errors": [str(e)],
             }
+
+    async def gnn_embed(
+        self,
+        kg_data: Optional[Dict[str, Any]] = None,
+        entity_ids: Optional[List[str]] = None,
+        top_k_similar: int = 5,
+        layer_type: str = "graph_sage",
+        embedding_dim: int = 64,
+        num_layers: int = 2,
+    ) -> Dict[str, Any]:
+        """
+        Compute GNN node embeddings for a knowledge graph.
+
+        Args:
+            kg_data: Optional serialised KG dict.
+            entity_ids: Optional entity IDs to return embeddings for.
+            top_k_similar: Number of most-similar entities to return per entity.
+            layer_type: Message-passing layer type.
+            embedding_dim: Target embedding dimensionality.
+            num_layers: Number of message-passing iterations.
+
+        Returns:
+            Dict with status, entity_count, embeddings, and similar.
+        """
+        try:
+            from ipfs_datasets_py.knowledge_graphs.extraction.graph import (
+                KnowledgeGraph,
+            )
+            from ipfs_datasets_py.knowledge_graphs.query.gnn import (
+                GraphNeuralNetworkAdapter,
+                GNNConfig,
+                GNNLayerType,
+            )
+
+            if kg_data:
+                kg = KnowledgeGraph.from_dict(kg_data)
+            else:
+                kg = KnowledgeGraph("gnn_embed_temp")
+
+            try:
+                layer = GNNLayerType(layer_type)
+            except ValueError:
+                layer = GNNLayerType.GRAPH_SAGE
+
+            config = GNNConfig(
+                embedding_dim=embedding_dim,
+                num_layers=num_layers,
+                layer_type=layer,
+            )
+            adapter = GraphNeuralNetworkAdapter(kg, config)
+            embedding_objects = adapter.compute_embeddings()
+
+            embeddings: Dict[str, List[float]] = {
+                eid: emb.features for eid, emb in embedding_objects.items()
+            }
+
+            similar: Dict[str, List[Dict[str, Any]]] = {}
+            if entity_ids:
+                for eid in entity_ids:
+                    if eid in kg.entities:
+                        results = adapter.find_similar_entities(eid, top_k=top_k_similar)
+                        similar[eid] = [
+                            {"entity_id": other_eid, "score": score}
+                            for other_eid, score in results
+                        ]
+
+            return {
+                "status": "success",
+                "entity_count": len(kg.entities),
+                "embedding_dim": embedding_dim,
+                "layer_type": layer_type,
+                "embeddings": embeddings,
+                "similar": similar,
+            }
+        except Exception as e:
+            self.logger.error("GNN embed failed: %s", e)
+            return {
+                "status": "error",
+                "message": str(e),
+                "entity_count": 0,
+                "embeddings": {},
+                "similar": {},
+            }
+
+    async def zkp_prove(
+        self,
+        proof_type: str = "entity_exists",
+        entity_type: Optional[str] = None,
+        entity_name: Optional[str] = None,
+        entity_id: Optional[str] = None,
+        property_key: Optional[str] = None,
+        property_value_hash: Optional[str] = None,
+        path_start_type: Optional[str] = None,
+        path_end_type: Optional[str] = None,
+        min_count: Optional[int] = None,
+        actual_count: Optional[int] = None,
+        kg_data: Optional[Dict[str, Any]] = None,
+        prover_id: str = "default",
+        build_tdfol_witness: bool = False,
+        circuit_version: int = 1,
+    ) -> Dict[str, Any]:
+        """
+        Generate a zero-knowledge proof for a KG assertion.
+
+        Args:
+            proof_type: One of entity_exists / entity_property / path_exists /
+                query_answer_count.
+            entity_type: Entity type for entity_exists / entity_property.
+            entity_name: Entity name for entity_exists.
+            entity_id: Private entity ID used in the witness.
+            property_key: Property key for entity_property.
+            property_value_hash: SHA-256 hash of the property value.
+            path_start_type: Start entity type for path_exists.
+            path_end_type: End entity type for path_exists.
+            min_count: Minimum count for query_answer_count.
+            actual_count: Actual count for query_answer_count.
+            kg_data: Optional serialised KG dict.
+            prover_id: Prover instance identifier.
+            build_tdfol_witness: When True, also build a TDFOL_v1 witness dict.
+            circuit_version: TDFOL_v1 circuit version.
+
+        Returns:
+            Dict with status, proof_type, proof, valid, and optionally tdfol_witness.
+        """
+        try:
+            from ipfs_datasets_py.knowledge_graphs.extraction.graph import (
+                KnowledgeGraph,
+            )
+            from ipfs_datasets_py.knowledge_graphs.query.zkp import (
+                KGZKProver,
+                KGZKVerifier,
+                KGProofType,
+            )
+
+            if kg_data:
+                kg = KnowledgeGraph.from_dict(kg_data)
+            else:
+                kg = KnowledgeGraph("zkp_temp")
+                if entity_type and entity_name:
+                    kg.add_entity(entity_type, entity_name, confidence=1.0)
+                # For path_exists proofs, add both start and end types with a relationship
+                if proof_type in ("path_exists", KGProofType.PATH_EXISTS.value):
+                    start_t = path_start_type or "entity"
+                    end_t = path_end_type or "entity"
+                    from ipfs_datasets_py.knowledge_graphs.extraction.graph import (
+                        Entity,
+                        Relationship,
+                    )
+                    start_ent = Entity(
+                        entity_id=f"start_{start_t}",
+                        entity_type=start_t,
+                        name=start_t,
+                    )
+                    end_ent = Entity(
+                        entity_id=f"end_{end_t}",
+                        entity_type=end_t,
+                        name=end_t,
+                    )
+                    kg.add_entity(start_ent)
+                    kg.add_entity(end_ent)
+                    kg.add_relationship(
+                        Relationship(
+                            relationship_id="r_path",
+                            relationship_type="connects",
+                            source_entity=start_ent,
+                            target_entity=end_ent,
+                        )
+                    )
+
+            prover = KGZKProver(kg, prover_id=prover_id)
+            verifier = KGZKVerifier()
+
+            stmt = None
+            if proof_type == KGProofType.ENTITY_EXISTS.value or proof_type == "entity_exists":
+                stmt = prover.prove_entity_exists(
+                    entity_type or "entity",
+                    entity_name or "unknown",
+                )
+            elif proof_type == KGProofType.ENTITY_PROPERTY.value or proof_type == "entity_property":
+                stmt = prover.prove_entity_property(
+                    entity_id or entity_name or "unknown",
+                    property_key or "property",
+                    property_value_hash or "",
+                )
+            elif proof_type == KGProofType.PATH_EXISTS.value or proof_type == "path_exists":
+                stmt = prover.prove_path_exists(
+                    path_start_type or "entity",
+                    path_end_type or "entity",
+                )
+            elif proof_type == KGProofType.QUERY_ANSWER_COUNT.value or proof_type == "query_answer_count":
+                # Add entities to the temp KG so the count proof can succeed
+                if not kg_data and actual_count and actual_count > 0:
+                    from ipfs_datasets_py.knowledge_graphs.extraction.graph import (
+                        Entity,
+                    )
+                    for i in range(actual_count):
+                        kg.add_entity(
+                            Entity(
+                                entity_id=f"count_ent_{i}",
+                                entity_type="entity",
+                                name=f"entity_{i}",
+                            )
+                        )
+                stmt = prover.prove_query_answer_count(
+                    min_count=min_count or 0,
+                )
+            else:
+                return {
+                    "status": "error",
+                    "message": f"Unknown proof_type: {proof_type!r}",
+                    "proof_type": proof_type,
+                    "proof": None,
+                    "valid": False,
+                }
+
+            valid = verifier.verify_statement(stmt) if stmt else False
+            result: Dict[str, Any] = {
+                "status": "success",
+                "proof_type": proof_type,
+                "proof": stmt.to_dict() if stmt else None,
+                "valid": valid,
+            }
+
+            if build_tdfol_witness and stmt:
+                from ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness import (
+                    KGWitnessBuilder,
+                )
+                builder = KGWitnessBuilder(circuit_version=circuit_version)
+                if proof_type in ("entity_exists", KGProofType.ENTITY_EXISTS.value):
+                    witness = builder.entity_exists(
+                        entity_type or "entity",
+                        entity_name or "unknown",
+                        entity_id or "eid_unknown",
+                    )
+                elif proof_type in ("path_exists", KGProofType.PATH_EXISTS.value):
+                    witness = builder.path_exists(
+                        path_ids=[
+                            entity_id or "eid_start",
+                            entity_id or "eid_end",
+                        ],
+                        start_type=path_start_type or "entity",
+                        end_type=path_end_type or "entity",
+                    )
+                elif proof_type in ("entity_property", KGProofType.ENTITY_PROPERTY.value):
+                    witness = builder.entity_property(
+                        entity_id or "eid_unknown",
+                        property_key or "property",
+                        property_value_hash or ("0" * 64),
+                    )
+                elif proof_type in ("query_answer_count", KGProofType.QUERY_ANSWER_COUNT.value):
+                    witness = builder.query_answer_count(
+                        min_count=min_count or 0,
+                        actual_count=actual_count or 0,
+                    )
+                else:
+                    witness = {}
+                result["tdfol_witness"] = witness
+
+            return result
+        except Exception as e:
+            self.logger.error("ZKP prove failed: %s", e)
+            return {
+                "status": "error",
+                "message": str(e),
+                "proof_type": proof_type,
+                "proof": None,
+                "valid": False,
+            }
+
+    async def federate_query(
+        self,
+        graphs: Optional[List[Dict[str, Any]]] = None,
+        query_entity_name: Optional[str] = None,
+        query_entity_type: Optional[str] = None,
+        resolution_strategy: str = "type_and_name",
+        merge: bool = False,
+        max_results: int = 50,
+    ) -> Dict[str, Any]:
+        """
+        Query across a federation of independent knowledge graphs.
+
+        Args:
+            graphs: Optional list of serialised KG dicts.
+            query_entity_name: Name of the entity to look up across graphs.
+            query_entity_type: Optional type filter for entity lookup.
+            resolution_strategy: Cross-graph entity resolution strategy.
+            merge: When True, merge all graphs and return merged counts.
+            max_results: Maximum number of entity-lookup results.
+
+        Returns:
+            Dict with status, graph_count, entity_matches, query_hits,
+            and optionally merged_entity_count.
+        """
+        try:
+            from ipfs_datasets_py.knowledge_graphs.extraction.graph import (
+                KnowledgeGraph,
+            )
+            from ipfs_datasets_py.knowledge_graphs.query.federation import (
+                FederatedKnowledgeGraph,
+                EntityResolutionStrategy,
+            )
+
+            # Parse resolution strategy
+            strategy_map = {
+                "type_and_name": EntityResolutionStrategy.TYPE_AND_NAME,
+                "exact_name": EntityResolutionStrategy.EXACT_NAME,
+                "property_match": EntityResolutionStrategy.PROPERTY_MATCH,
+            }
+            strategy = strategy_map.get(
+                resolution_strategy.lower(),
+                EntityResolutionStrategy.TYPE_AND_NAME,
+            )
+
+            fed = FederatedKnowledgeGraph()
+
+            kg_list: List[KnowledgeGraph] = []
+            for i, kg_dict in enumerate(graphs or []):
+                kg = KnowledgeGraph.from_dict(kg_dict)
+                fed.add_graph(kg, name=f"graph_{i}")
+                kg_list.append(kg)
+
+            # Resolve entity matches across all graph pairs
+            matches = fed.resolve_entities(strategy=strategy)
+            entity_matches = [
+                {
+                    "entity_a_id": m.entity_a_id,
+                    "entity_b_id": m.entity_b_id,
+                    "kg_a_index": m.kg_a_index,
+                    "kg_b_index": m.kg_b_index,
+                    "score": m.score,
+                    "strategy": m.strategy.value if isinstance(m.strategy, EntityResolutionStrategy) else str(m.strategy),
+                }
+                for m in matches
+            ]
+
+            # Entity lookup across all graphs
+            query_hits: List[Dict[str, Any]] = []
+            if query_entity_name:
+                hits = fed.query_entity(
+                    name=query_entity_name,
+                    entity_type=query_entity_type,
+                )
+                query_hits = [
+                    {
+                        "graph_index": idx,
+                        "entity_id": entity.entity_id,
+                        "entity_type": entity.entity_type,
+                        "name": entity.name,
+                    }
+                    for idx, entity in hits[:max_results]
+                ]
+
+            result: Dict[str, Any] = {
+                "status": "success",
+                "graph_count": len(kg_list),
+                "resolution_strategy": resolution_strategy,
+                "entity_matches": entity_matches,
+                "query_hits": query_hits,
+            }
+
+            if merge:
+                merged = fed.to_merged_graph()
+                result["merged_entity_count"] = len(merged.entities)
+                result["merged_relationship_count"] = len(merged.relationships)
+
+            return result
+        except Exception as e:
+            self.logger.error("Federate query failed: %s", e)
+            return {
+                "status": "error",
+                "message": str(e),
+                "graph_count": len(graphs) if graphs else 0,
+                "entity_matches": [],
+                "query_hits": [],
+            }
diff --git a/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md b/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md
index a6fdac944..85ab4bb6b 100644
--- a/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md
+++ b/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md
@@ -5,6 +5,39 @@ All notable changes to the knowledge_graphs module will be documented in this fi
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 
+## [3.22.37] - 2026-02-23
+
+### Added — 3 new MCP server tools for GNN, ZKP, and Federation (Session 83) — 48 tests
+
+**`mcp_server/tools/graph_tools/graph_gnn_embed.py`** (new MCP tool):
+- `graph_gnn_embed(kg_data, entity_ids, top_k_similar, layer_type, embedding_dim, num_layers)` — compute GNN node embeddings
+- Delegates to `KnowledgeGraphManager.gnn_embed()` → `GraphNeuralNetworkAdapter`
+- Supports layer types: `"graph_conv"` / `"graph_sage"` / `"graph_attention"`
+- Returns `status / entity_count / embedding_dim / layer_type / embeddings / similar`
+
+**`mcp_server/tools/graph_tools/graph_zkp_prove.py`** (new MCP tool):
+- `graph_zkp_prove(proof_type, entity_type, entity_name, ...)` — generate ZK proofs
+- Proof types: `entity_exists` / `entity_property` / `path_exists` / `query_answer_count`
+- Optional `build_tdfol_witness=True` to also generate TDFOL_v1 witness dict
+- Returns `status / proof_type / proof / valid / tdfol_witness`
+
+**`mcp_server/tools/graph_tools/graph_federate_query.py`** (new MCP tool):
+- `graph_federate_query(graphs, query_entity_name, resolution_strategy, merge, ...)` — query across federated KGs
+- Delegates to `KnowledgeGraphManager.federate_query()` → `FederatedKnowledgeGraph`
+- Strategies: `"type_and_name"` / `"exact_name"` / `"property_match"`
+- Returns `status / graph_count / entity_matches / query_hits / merged_entity_count`
+
+**`core_operations/knowledge_graph_manager.py`** (updated):
+- Added `gnn_embed()` — compute GNN embeddings + similar entities
+- Added `zkp_prove()` — generate ZK proofs with optional TDFOL_v1 witness
+- Added `federate_query()` — cross-graph entity resolution and query
+
+**`mcp_server/tools/graph_tools/__init__.py`** (updated):
+- 19 → 22 tools; `graph_gnn_embed`, `graph_zkp_prove`, `graph_federate_query` added to `__all__`
+
+**`mcp_server/tools/graph_tools/README.md`** (updated):
+- 3 new rows for session 83 tools
+
 ## [3.22.36] - 2026-02-23
 
 ### Added — TDFOL_v1 Witness Builder for Groth16 backend (Session 82) — 50 tests
diff --git a/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md b/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md
index cc1890c22..1ca78ff4a 100644
--- a/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md
+++ b/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md
@@ -688,9 +688,48 @@ assert kg.list_snapshots() == ["before_merge"]
 
 ---
 
-## P13: Delivered in v3.22.36 (TDFOL_v1 Witness Builder for Groth16 backend)
+## P14: Delivered in v3.22.37 (MCP tools for GNN, ZKP, and Federation)
+
+### 29. GNN Embed MCP Tool
+
+**Status:** ✅ Implemented (v3.22.37 — 2026-02-23)
+**Location:** `mcp_server/tools/graph_tools/graph_gnn_embed.py` + `core_operations/knowledge_graph_manager.KnowledgeGraphManager.gnn_embed()`
+**Implementation:**
+- `graph_gnn_embed(kg_data, entity_ids, top_k_similar, layer_type, embedding_dim, num_layers)` — compute GNN node embeddings via `GraphNeuralNetworkAdapter`
+- Layer types: `GRAPH_CONV` / `GRAPH_SAGE` *(default)* / `GRAPH_ATTENTION`
+- Returns per-entity embedding vectors + optional top-*k* similar entities
+
+**Tests:** `tests/unit/knowledge_graphs/test_master_status_session83.py`
+
+---
+
+### 30. ZKP Prove MCP Tool
+
+**Status:** ✅ Implemented (v3.22.37 — 2026-02-23)
+**Location:** `mcp_server/tools/graph_tools/graph_zkp_prove.py` + `core_operations/knowledge_graph_manager.KnowledgeGraphManager.zkp_prove()`
+**Implementation:**
+- `graph_zkp_prove(proof_type, ..., build_tdfol_witness, circuit_version)` — generate ZK proofs
+- Proof types: `entity_exists` / `entity_property` / `path_exists` / `query_answer_count`
+- Optional `build_tdfol_witness=True` produces TDFOL_v1 witness dict for Groth16 Rust backend
 
-### 27. TDFOL_v1 Atom Encoder
+**Tests:** `tests/unit/knowledge_graphs/test_master_status_session83.py`
+
+---
+
+### 31. Federate Query MCP Tool
+
+**Status:** ✅ Implemented (v3.22.37 — 2026-02-23)
+**Location:** `mcp_server/tools/graph_tools/graph_federate_query.py` + `core_operations/knowledge_graph_manager.KnowledgeGraphManager.federate_query()`
+**Implementation:**
+- `graph_federate_query(graphs, query_entity_name, resolution_strategy, merge, ...)` — cross-graph entity resolution and query
+- Strategies: `"type_and_name"` *(default)* / `"exact_name"` / `"property_match"`
+- Returns entity matches, query hits (name-based lookup), and optional merged graph counts
+
+**Tests:** `tests/unit/knowledge_graphs/test_master_status_session83.py`
+
+---
+
+## P13: Delivered in v3.22.36 (TDFOL_v1 Witness Builder for Groth16 backend)
 
 **Status:** ✅ Implemented (v3.22.36 — 2026-02-23)
 **Location:** `query/groth16_kg_witness.py` — `KGAtomEncoder`
diff --git a/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md b/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md
index ff3add900..df6f08c8f 100644
--- a/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md
+++ b/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md
@@ -30,6 +30,7 @@
 
 ## Session log (most recent first)
 
+- **Session 83 (2026-02-23):** 3 new MCP server tools — `graph_gnn_embed.py` (compute GNN node embeddings via `GraphNeuralNetworkAdapter`; GRAPH_CONV/SAGE/ATTENTION; top-k similar entities; `KnowledgeGraphManager.gnn_embed()`) + `graph_zkp_prove.py` (generate ZK proofs for entity_exists/path_exists/entity_property/query_answer_count; optional TDFOL_v1 witness build via `KGWitnessBuilder`; `KnowledgeGraphManager.zkp_prove()`) + `graph_federate_query.py` (cross-graph entity resolution + entity lookup + merge via `FederatedKnowledgeGraph`; type_and_name/exact_name/property_match strategies; `KnowledgeGraphManager.federate_query()`); graph_tools/__init__.py 19→22 tools; README.md updated; DEFERRED_FEATURES P14 §29–31; 48 tests. v3.22.36→v3.22.37.
 - **Session 82 (2026-02-23):** TDFOL_v1 witness builder — `query/groth16_kg_witness.py` (`KGAtomEncoder`: normalize KG strings to valid single-word TDFOL_v1 atoms via `normalize()`/`encode_entity_type()`/`encode_name()`/`encode_relationship_type()`/`encode_entity_id()`/`encode_property_key()`/`atom_for_entity()`/`atom_for_entity_exists()`/`atom_for_path_exists()`/`atom_for_entity_property()`; `KGWitnessBuilder`: build complete TDFOL_v1 witness input dicts for `entity_exists`/`path_exists`/`entity_property`/`query_answer_count` proofs; auto-computes `theorem_hash_hex`+`axioms_commitment_hex`; circuit v2 support); `KGEntityFormula.to_tdfol_atoms()` classmethod added to `groth16_bridge.py`; `query/__init__.py` + `__all__` updated; DEFERRED_FEATURES P13 §27+§28; 80 tests. v3.22.35→v3.22.36.
 - **Session 81 (2026-02-23):** 5 new MCP server tools exposing query/extraction features — `graph_graphql_query.py` (execute GraphQL query via `KnowledgeGraphQLExecutor`) + `graph_visualize.py` (DOT/Mermaid/D3 JSON/ASCII via `KnowledgeGraphVisualizer`) + `graph_complete_suggestions.py` (missing-relationship suggestions via `KnowledgeGraphCompleter`) + `graph_explain.py` (explainable-AI entity/relationship/path/why_connected via `QueryExplainer`) + `graph_provenance_verify.py` (tamper-detection via `ProvenanceChain.verify_chain()`); 5 new `KnowledgeGraphManager` async methods; `graph_tools/__init__.py` + `README.md` updated (11→19 tools); 42 tests. v3.22.34→v3.22.35.
 - **Session 80 (2026-02-23):** ROADMAP Research Areas delivered — `query/completion.py` (`KnowledgeGraphCompleter`; 6 structural completion patterns: triadic closure, common neighbour, symmetric relation, transitive relation, inverse relation, type compatibility; `CompletionSuggestion` + `CompletionReason`; `find_missing_relationships`/`find_isolated_entities`/`compute_completion_score`/`explain_suggestion`) + `query/explanation.py` (`QueryExplainer`; `explain_entity`/`explain_relationship`/`explain_path`/`explain_query_result`/`why_connected`/`entity_importance_score`; `EntityExplanation`/`RelationshipExplanation`/`PathExplanation`/`ExplanationDepth` dataclasses); 8 new symbols in `query/__init__.py`; DEFERRED_FEATURES P12 §25+§26; 52 tests. v3.22.33→v3.22.34.
diff --git a/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md b/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md
index ad7cb21b7..91ae3f004 100644
--- a/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md
+++ b/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md
@@ -1,9 +1,9 @@
 # Knowledge Graphs Module - Master Status Document
 
-**Version:** 3.22.36  
+**Version:** 3.22.37  
 **Status:** ✅ Production Ready  
-**Last Updated:** 2026-02-23 (session 82)  
-**Last Major Release:** v3.22.36 (session 82: `KGAtomEncoder` + `KGWitnessBuilder` in `query/groth16_kg_witness.py` — TDFOL_v1 atom normalization and witness input construction for the Groth16 Rust backend; `KGEntityFormula.to_tdfol_atoms()` added to `groth16_bridge.py`; `query/__init__.py` exports updated; 50 tests)
+**Last Updated:** 2026-02-23 (session 83)  
+**Last Major Release:** v3.22.37 (session 83: 3 new MCP server tools — `graph_gnn_embed` / `graph_zkp_prove` / `graph_federate_query`; 3 new `KnowledgeGraphManager` methods; `graph_tools/__init__.py` updated 19→22 tools; `README.md` updated; 48 tests)
 
 ---
 
@@ -19,7 +19,7 @@
 | **Folder Refactoring** | ✅ Complete | All root-level modules moved to subpackages (2026-02-20) |
 | **New MCP Tools** | ✅ Complete | graph_srl_extract, graph_ontology_materialize, graph_distributed_execute, graph_graphql_query, graph_visualize, graph_complete_suggestions, graph_explain, graph_provenance_verify |
 | **Test Coverage** | **99.99% (1 missed line)** | Session 58: 3,759 pass, 2 skip, **0 fail** (full dep env); 1 missed line |
-| **Documentation** | ✅ Up to Date | Reflects v3.22.36 structure |
+| **Documentation** | ✅ Up to Date | Reflects v3.22.37 structure |
 | **Known Issues** | None | 0 failures; all skips intentional (libipld/spaCy absent when not installed) |
 | **Next Milestone** | v4.0 (2027+) | 1 missed line: `_entity_helpers.py:117` (intentional defensive guard) — 99.99% coverage |
 
diff --git a/ipfs_datasets_py/knowledge_graphs/ROADMAP.md b/ipfs_datasets_py/knowledge_graphs/ROADMAP.md
index db2bddc88..272b64968 100644
--- a/ipfs_datasets_py/knowledge_graphs/ROADMAP.md
+++ b/ipfs_datasets_py/knowledge_graphs/ROADMAP.md
@@ -1,7 +1,7 @@
 # Knowledge Graphs - Development Roadmap
 
 **Last Updated:** 2026-02-23  
-**Current Version:** 3.22.36  
+**Current Version:** 3.22.37  
 **Status:** Production Ready (99.99% test coverage)
 
 ---
@@ -439,6 +439,7 @@ We follow [Semantic Versioning](https://semver.org/):
 | 3.22.30 | 2026-02-23 | ✅ Released | Deferred v4.0+ GNN integration (query/gnn.py: GraphNeuralNetworkAdapter with GRAPH_CONV/SAGE/ATTENTION; node embeddings, link prediction, similar-entity search, numpy/PyTorch export) + ZKP support (query/zkp.py: KGZKProver/KGZKVerifier; 4 proof types; SHA-256 commitments; nullifier replay protection); DEFERRED_FEATURES P11 §23+§24; 55 tests (session76) |
 | 3.22.35 | 2026-02-23 | ✅ Released | 5 new MCP tools for query/extraction features (graph_graphql_query, graph_visualize, graph_complete_suggestions, graph_explain, graph_provenance_verify); 5 new KnowledgeGraphManager methods; graph_tools/__init__.py+README.md updated; 42 tests (session81) |
 | 3.22.36 | 2026-02-23 | ✅ Released | TDFOL_v1 witness builder: `query/groth16_kg_witness.py` (`KGAtomEncoder` normalizes KG strings to valid single-word TDFOL_v1 atoms; `KGWitnessBuilder` builds complete witness input dicts for entity_exists/path_exists/entity_property/query_answer_count proofs compatible with Groth16 Rust backend); `KGEntityFormula.to_tdfol_atoms()` classmethod added; `query/__init__.py` exports updated; 50 tests (session82) |
+| 3.22.37 | 2026-02-23 | ✅ Released | 3 new MCP server tools: `graph_gnn_embed.py` (compute GNN node embeddings via `GraphNeuralNetworkAdapter`; layer types GRAPH_CONV/SAGE/ATTENTION; top-k similar entities; embedding vectors per entity) + `graph_zkp_prove.py` (generate ZK proofs for entity_exists/path_exists/entity_property/query_answer_count; optional TDFOL_v1 witness build) + `graph_federate_query.py` (query across federated KGs via `FederatedKnowledgeGraph`; entity resolution type_and_name/exact_name/property_match; merge mode; entity lookup); 3 new `KnowledgeGraphManager` methods; graph_tools/__init__.py 19→22 tools; README.md updated; 48 tests (session83) |
 | 3.22.34 | 2026-02-23 | ✅ Released | ROADMAP Research Areas: Knowledge Graph Completion (query/completion.py: KnowledgeGraphCompleter; 6 structural patterns: triadic closure/common neighbour/symmetric/transitive/inverse/type-compat; CompletionSuggestion+CompletionReason) + Explainable AI (query/explanation.py: QueryExplainer; explain_entity/relationship/path/why_connected/entity_importance_score; SURFACE/STANDARD/DEEP depth; EntityExplanation/RelationshipExplanation/PathExplanation); DEFERRED_FEATURES P12 §25+§26; 52 tests (session80) |
 | 3.22.33 | 2026-02-23 | ✅ Released | Comprehensive documentation update: query/README.md v2.1.0→v3.22.33 (5 new module sections + Advanced Query Features + Recent Additions table); docs/knowledge_graphs/API_REFERENCE.md v3.22.22→v3.22.33 (Advanced Extraction APIs + Advanced Query APIs sections with examples); docs/knowledge_graphs/USER_GUIDE.md v2.0.0→v3.22.33 (§11 Future Roadmap→Delivered Features table with 15 items all ✅); 46 doc tests (session79) |
 | 3.22.32 | 2026-02-23 | ✅ Released | Groth16 Bridge: query/groth16_bridge.py (groth16_binary_available+groth16_enabled+Groth16KGConfig+KGEntityFormula+create_groth16_kg_prover+create_groth16_kg_verifier+describe_groth16_status); direct KG↔TDFOL_v1 theorem/axiom mapping; binary availability probe; 7 query/__init__.py exports; DEFERRED_FEATURES §24 Direct Groth16 Bridge subsection; 50 tests (session78) |
diff --git a/ipfs_datasets_py/mcp_server/tools/graph_tools/README.md b/ipfs_datasets_py/mcp_server/tools/graph_tools/README.md
index de838f14e..a5d1fc3e0 100644
--- a/ipfs_datasets_py/mcp_server/tools/graph_tools/README.md
+++ b/ipfs_datasets_py/mcp_server/tools/graph_tools/README.md
@@ -27,6 +27,9 @@ The underlying graph engine supports Neo4j, in-memory, and IPLD-backed backends.
 | `graph_complete_suggestions.py` | `graph_complete_suggestions()` | Suggest missing relationships (KG completion) *(new v3.22.35)* |
 | `graph_explain.py` | `graph_explain()` | Explainable-AI explanations for entities, relationships, and paths *(new v3.22.35)* |
 | `graph_provenance_verify.py` | `graph_provenance_verify()` | Verify integrity of the provenance chain *(new v3.22.35)* |
+| `graph_gnn_embed.py` | `graph_gnn_embed()` | Compute GNN node embeddings (GRAPH_CONV / SAGE / ATTENTION) *(new v3.22.37)* |
+| `graph_zkp_prove.py` | `graph_zkp_prove()` | Generate zero-knowledge proofs for KG assertions *(new v3.22.37)* |
+| `graph_federate_query.py` | `graph_federate_query()` | Query across federated knowledge graphs *(new v3.22.37)* |
 
 ## Usage
 
diff --git a/ipfs_datasets_py/mcp_server/tools/graph_tools/__init__.py b/ipfs_datasets_py/mcp_server/tools/graph_tools/__init__.py
index bfd9ff46e..a707daf2d 100644
--- a/ipfs_datasets_py/mcp_server/tools/graph_tools/__init__.py
+++ b/ipfs_datasets_py/mcp_server/tools/graph_tools/__init__.py
@@ -24,6 +24,9 @@
 from .graph_complete_suggestions import graph_complete_suggestions
 from .graph_explain import graph_explain
 from .graph_provenance_verify import graph_provenance_verify
+from .graph_gnn_embed import graph_gnn_embed
+from .graph_zkp_prove import graph_zkp_prove
+from .graph_federate_query import graph_federate_query
 
 __all__ = [
     "query_knowledge_graph",
@@ -45,4 +48,7 @@
     "graph_complete_suggestions",
     "graph_explain",
     "graph_provenance_verify",
+    "graph_gnn_embed",
+    "graph_zkp_prove",
+    "graph_federate_query",
 ]
diff --git a/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_federate_query.py b/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_federate_query.py
new file mode 100644
index 000000000..b91a634ab
--- /dev/null
+++ b/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_federate_query.py
@@ -0,0 +1,98 @@
+"""
+MCP tool for querying across federated knowledge graphs.
+
+Thin wrapper around KnowledgeGraphManager.federate_query().
+Core implementation: ipfs_datasets_py.core_operations.knowledge_graph_manager
+"""
+
+import logging
+from typing import Any, Dict, List, Optional
+
+logger = logging.getLogger(__name__)
+
+from ipfs_datasets_py.core_operations import KnowledgeGraphManager
+
+
+async def graph_federate_query(
+    graphs: Optional[List[Dict[str, Any]]] = None,
+    query_entity_name: Optional[str] = None,
+    query_entity_type: Optional[str] = None,
+    resolution_strategy: str = "type_and_name",
+    merge: bool = False,
+    max_results: int = 50,
+) -> Dict[str, Any]:
+    """
+    Query across a federation of independent knowledge graphs.
+
+    Uses :class:`~ipfs_datasets_py.knowledge_graphs.query.federation.FederatedKnowledgeGraph`
+    to perform cross-graph entity resolution and unified query execution across
+    multiple independent knowledge graphs.
+
+    **Entity resolution strategies:**
+
+    - ``"type_and_name"`` *(default)* — entities match when both
+      ``(entity_type.lower(), name.lower())`` are equal.  Prevents
+      "person:Alice" from merging with "company:Alice".
+    - ``"exact_name"`` — match on ``name`` only (case-insensitive).
+    - ``"property_match"`` — additionally requires at least one matching
+      property key/value pair.
+
+    **Two query modes:**
+
+    1. **Entity lookup** (set *query_entity_name* and optionally
+       *query_entity_type*) — search for an entity across all graphs.
+    2. **Merge** (*merge=True*) — merge all supplied graphs into a single
+       deduplicated :class:`~extraction.graph.KnowledgeGraph`.
+
+    Args:
+        graphs: Optional list of serialised knowledge-graph dicts
+            (each from ``kg.to_dict()``).  When ``None`` or empty, an empty
+            result is returned.
+        query_entity_name: Name of the entity to search for across all
+            graphs.  When ``None``, entity-lookup mode is skipped.
+        query_entity_type: Optional type filter for entity lookup.
+        resolution_strategy: Cross-graph entity resolution strategy; one of
+            ``"type_and_name"`` *(default)*, ``"exact_name"``, or
+            ``"property_match"``.
+        merge: When ``True``, merge all graphs into one and return the merged
+            graph entity/relationship counts.  Default ``False``.
+        max_results: Maximum number of entity-lookup results returned.
+            Default 50.
+
+    Returns:
+        Dict containing:
+
+        - ``status``: ``"success"`` or ``"error"``
+        - ``graph_count``: number of input graphs
+        - ``resolution_strategy``: strategy used
+        - ``entity_matches``: list of cross-graph entity match dicts (each
+          with ``entity_a_id``, ``entity_b_id``, ``kg_a_index``,
+          ``kg_b_index``, ``score``, ``strategy``) — only when *graphs* given
+        - ``query_hits``: list of ``{"graph_index": int, "entity_id": str,
+          "entity_type": str, "name": str}`` — only when *query_entity_name*
+          given
+        - ``merged_entity_count``: entity count after merge (only when
+          *merge=True*)
+        - ``merged_relationship_count``: relationship count after merge (only
+          when *merge=True*)
+    """
+    try:
+        manager = KnowledgeGraphManager()
+        result = await manager.federate_query(
+            graphs=graphs,
+            query_entity_name=query_entity_name,
+            query_entity_type=query_entity_type,
+            resolution_strategy=resolution_strategy,
+            merge=merge,
+            max_results=max_results,
+        )
+        return result
+    except Exception as e:
+        logger.error("Error in graph_federate_query MCP tool: %s", e)
+        return {
+            "status": "error",
+            "message": str(e),
+            "graph_count": len(graphs) if graphs else 0,
+            "entity_matches": [],
+            "query_hits": [],
+        }
diff --git a/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_gnn_embed.py b/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_gnn_embed.py
new file mode 100644
index 000000000..fce2b3e8d
--- /dev/null
+++ b/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_gnn_embed.py
@@ -0,0 +1,83 @@
+"""
+MCP tool for computing GNN node embeddings from a knowledge graph.
+
+Thin wrapper around KnowledgeGraphManager.gnn_embed().
+Core implementation: ipfs_datasets_py.core_operations.knowledge_graph_manager
+"""
+
+import logging
+from typing import Any, Dict, List, Optional
+
+logger = logging.getLogger(__name__)
+
+from ipfs_datasets_py.core_operations import KnowledgeGraphManager
+
+
+async def graph_gnn_embed(
+    kg_data: Optional[Dict[str, Any]] = None,
+    entity_ids: Optional[List[str]] = None,
+    top_k_similar: int = 5,
+    layer_type: str = "graph_sage",
+    embedding_dim: int = 64,
+    num_layers: int = 2,
+) -> Dict[str, Any]:
+    """
+    Compute Graph Neural Network (GNN) node embeddings for a knowledge graph.
+
+    Uses the pure-Python ``GraphNeuralNetworkAdapter`` (no PyTorch / TensorFlow
+    required) to run message-passing on the graph and produce per-entity
+    embedding vectors.  Optionally returns the top-*k* most similar entities
+    for each requested entity.
+
+    **Supported layer types:**
+
+    - ``"graph_conv"`` — simple graph convolution (sum aggregation + self-loop)
+    - ``"graph_sage"`` — GraphSAGE mean aggregation *(default)*
+    - ``"graph_attention"`` — single-head simplified attention
+
+    Args:
+        kg_data: Optional serialised knowledge-graph dict (from ``kg.to_dict()``).
+            When ``None`` an empty in-memory graph is used and the result will
+            contain zero embeddings.
+        entity_ids: Optional list of entity IDs for which to return embeddings
+            and top-*k* similar entities.  When ``None``, all entities are
+            included.
+        top_k_similar: Number of most-similar entities to return per entity
+            (default 5).  Only computed when *entity_ids* is given.
+        layer_type: Message-passing layer type; one of ``"graph_conv"``,
+            ``"graph_sage"``, or ``"graph_attention"``.  Default
+            ``"graph_sage"``.
+        embedding_dim: Target embedding dimensionality (default 64).
+        num_layers: Number of message-passing iterations (default 2).
+
+    Returns:
+        Dict containing:
+
+        - ``status``: ``"success"`` or ``"error"``
+        - ``entity_count``: total number of entities in the graph
+        - ``embedding_dim``: actual embedding dimension used
+        - ``layer_type``: layer type used
+        - ``embeddings``: mapping of ``entity_id → [float, ...]`` (all entities)
+        - ``similar``: mapping of ``entity_id → [{"entity_id": str,
+          "score": float}]`` (only when *entity_ids* supplied)
+    """
+    try:
+        manager = KnowledgeGraphManager()
+        result = await manager.gnn_embed(
+            kg_data=kg_data,
+            entity_ids=entity_ids,
+            top_k_similar=top_k_similar,
+            layer_type=layer_type,
+            embedding_dim=embedding_dim,
+            num_layers=num_layers,
+        )
+        return result
+    except Exception as e:
+        logger.error("Error in graph_gnn_embed MCP tool: %s", e)
+        return {
+            "status": "error",
+            "message": str(e),
+            "entity_count": 0,
+            "embeddings": {},
+            "similar": {},
+        }
diff --git a/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_zkp_prove.py b/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_zkp_prove.py
new file mode 100644
index 000000000..7f2e37955
--- /dev/null
+++ b/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_zkp_prove.py
@@ -0,0 +1,119 @@
+"""
+MCP tool for zero-knowledge proof generation over knowledge graph assertions.
+
+Thin wrapper around KnowledgeGraphManager.zkp_prove().
+Core implementation: ipfs_datasets_py.core_operations.knowledge_graph_manager
+"""
+
+import logging
+from typing import Any, Dict, Optional
+
+logger = logging.getLogger(__name__)
+
+from ipfs_datasets_py.core_operations import KnowledgeGraphManager
+
+
+async def graph_zkp_prove(
+    proof_type: str = "entity_exists",
+    entity_type: Optional[str] = None,
+    entity_name: Optional[str] = None,
+    entity_id: Optional[str] = None,
+    property_key: Optional[str] = None,
+    property_value_hash: Optional[str] = None,
+    path_start_type: Optional[str] = None,
+    path_end_type: Optional[str] = None,
+    min_count: Optional[int] = None,
+    actual_count: Optional[int] = None,
+    kg_data: Optional[Dict[str, Any]] = None,
+    prover_id: str = "default",
+    build_tdfol_witness: bool = False,
+    circuit_version: int = 1,
+) -> Dict[str, Any]:
+    """
+    Generate a zero-knowledge proof for a knowledge-graph assertion.
+
+    Uses :class:`~ipfs_datasets_py.knowledge_graphs.query.zkp.KGZKProver` to
+    produce a :class:`~ipfs_datasets_py.knowledge_graphs.query.zkp.KGProofStatement`
+    — a privacy-preserving proof that a property holds over the graph without
+    revealing entity IDs or other private data.
+
+    When *build_tdfol_witness* is ``True``, the tool also builds a
+    TDFOL_v1-compatible witness dict (via
+    :class:`~ipfs_datasets_py.knowledge_graphs.query.groth16_kg_witness.KGWitnessBuilder`)
+    ready for submission to the Groth16 Rust backend.
+
+    **Supported proof types:**
+
+    - ``"entity_exists"`` — prove an entity with *entity_type* + *entity_name*
+      exists.  Requires *entity_type* and *entity_name*.
+    - ``"entity_property"`` — prove an entity has a property value.  Requires
+      *entity_id* (or *entity_name*), *property_key*, and *property_value_hash*.
+    - ``"path_exists"`` — prove a path between two entity types exists.  Requires
+      *path_start_type* and *path_end_type*.
+    - ``"query_answer_count"`` — prove the result count is ≥ *min_count*.
+      Requires *min_count* and *actual_count*.
+
+    Args:
+        proof_type: One of ``"entity_exists"``, ``"entity_property"``,
+            ``"path_exists"``, ``"query_answer_count"``.  Default
+            ``"entity_exists"``.
+        entity_type: Entity type for ``entity_exists`` / ``entity_property``
+            proofs.
+        entity_name: Entity name for ``entity_exists`` proofs.
+        entity_id: Private entity ID used in the witness (not revealed in proof).
+        property_key: Property key for ``entity_property`` proofs.
+        property_value_hash: 64-char hex SHA-256 of the property value.
+        path_start_type: Starting entity type for ``path_exists`` proofs.
+        path_end_type: Ending entity type for ``path_exists`` proofs.
+        min_count: Minimum count for ``query_answer_count`` proofs.
+        actual_count: Actual (private) count for ``query_answer_count`` proofs.
+        kg_data: Optional serialised KG dict.  When supplied, the prover
+            operates over the provided graph.
+        prover_id: Stable identifier for the prover instance (used in
+            nullifier computation).  Default ``"default"``.
+        build_tdfol_witness: When ``True``, also build and return a
+            TDFOL_v1 witness dict for the Groth16 backend.  Default
+            ``False``.
+        circuit_version: TDFOL_v1 circuit version (1 or 2) used when
+            *build_tdfol_witness* is ``True``.  Default 1.
+
+    Returns:
+        Dict containing:
+
+        - ``status``: ``"success"`` or ``"error"``
+        - ``proof_type``: the proof type used
+        - ``proof``: the serialised :class:`KGProofStatement` dict
+          (``proof_type``, ``commitment``, ``nullifier``, ``parameters``,
+          ``public_inputs``, ``timestamp``)
+        - ``valid``: ``True`` if the proof was immediately verified
+        - ``tdfol_witness``: TDFOL_v1 witness dict (only when
+          *build_tdfol_witness* is ``True``)
+    """
+    try:
+        manager = KnowledgeGraphManager()
+        result = await manager.zkp_prove(
+            proof_type=proof_type,
+            entity_type=entity_type,
+            entity_name=entity_name,
+            entity_id=entity_id,
+            property_key=property_key,
+            property_value_hash=property_value_hash,
+            path_start_type=path_start_type,
+            path_end_type=path_end_type,
+            min_count=min_count,
+            actual_count=actual_count,
+            kg_data=kg_data,
+            prover_id=prover_id,
+            build_tdfol_witness=build_tdfol_witness,
+            circuit_version=circuit_version,
+        )
+        return result
+    except Exception as e:
+        logger.error("Error in graph_zkp_prove MCP tool: %s", e)
+        return {
+            "status": "error",
+            "message": str(e),
+            "proof_type": proof_type,
+            "proof": None,
+            "valid": False,
+        }
diff --git a/tests/unit/knowledge_graphs/test_master_status_session82.py b/tests/unit/knowledge_graphs/test_master_status_session82.py
index bc465678e..b02a3834e 100644
--- a/tests/unit/knowledge_graphs/test_master_status_session82.py
+++ b/tests/unit/knowledge_graphs/test_master_status_session82.py
@@ -584,8 +584,12 @@ def test_witness_builder_and_zkp_prover_compatible(self):
 # ---------------------------------------------------------------------------
 class TestDocumentationIntegrity:
     def test_master_status_has_v3_22_36(self):
-        content = _read(_MASTER)
-        assert "3.22.36" in content, "MASTER_STATUS.md should mention v3.22.36"
+        # v3.22.36 may appear in CHANGELOG but MASTER_STATUS advances to 3.22.37+
+        # Accept either MASTER_STATUS or CHANGELOG containing the version
+        ms_content = _read(_MASTER)
+        cl_content = _read(_CHANGELOG)
+        assert "3.22.36" in ms_content or "3.22.36" in cl_content, \
+            "3.22.36 should appear in MASTER_STATUS.md or CHANGELOG"
 
     def test_roadmap_has_v3_22_36(self):
         content = _read(_ROADMAP)
diff --git a/tests/unit/knowledge_graphs/test_master_status_session83.py b/tests/unit/knowledge_graphs/test_master_status_session83.py
new file mode 100644
index 000000000..00a2ce6e7
--- /dev/null
+++ b/tests/unit/knowledge_graphs/test_master_status_session83.py
@@ -0,0 +1,537 @@
+"""
+Tests for Session 83: 3 new MCP tools for GNN, ZKP, and Federation.
+
+Session 83 (v3.22.37):
+- graph_gnn_embed.py   — compute GNN node embeddings via GraphNeuralNetworkAdapter
+- graph_zkp_prove.py   — generate ZK proofs via KGZKProver + KGWitnessBuilder
+- graph_federate_query.py — query across federated KGs via FederatedKnowledgeGraph
+- 3 new KnowledgeGraphManager methods: gnn_embed / zkp_prove / federate_query
+- graph_tools/__init__.py updated (19→22 tools), README.md updated
+"""
+
+from __future__ import annotations
+
+import asyncio
+import pathlib
+import sys
+import types
+
+import pytest
+
+# ---------------------------------------------------------------------------
+# Stub anyio so the graph_tools package can be imported without it installed.
+# ---------------------------------------------------------------------------
+if "anyio" not in sys.modules:
+    sys.modules["anyio"] = types.ModuleType("anyio")
+
+# ---------------------------------------------------------------------------
+# Helpers / fixtures
+# ---------------------------------------------------------------------------
+_BASE = pathlib.Path(__file__).parent.parent.parent.parent
+_KG_ROOT = _BASE / "ipfs_datasets_py" / "knowledge_graphs"
+_MASTER = _KG_ROOT / "MASTER_STATUS.md"
+_CHANGELOG = _KG_ROOT / "CHANGELOG_KNOWLEDGE_GRAPHS.md"
+_ROADMAP = _KG_ROOT / "ROADMAP.md"
+_README_GT = (
+    _BASE / "ipfs_datasets_py" / "mcp_server" / "tools" / "graph_tools" / "README.md"
+)
+
+
+def _read(path: pathlib.Path) -> str:
+    return path.read_text(encoding="utf-8")
+
+
+def _make_kg(name="test_session83"):
+    """Build a small test KnowledgeGraph with 3 entities + 2 relationships."""
+    from ipfs_datasets_py.knowledge_graphs.extraction.graph import (
+        KnowledgeGraph,
+        Entity,
+        Relationship,
+    )
+
+    kg = KnowledgeGraph(name=name)
+    alice = Entity(entity_id="alice", entity_type="person", name="alice")
+    bob = Entity(entity_id="bob", entity_type="person", name="bob")
+    acme = Entity(entity_id="acme", entity_type="org", name="acme")
+    for e in (alice, bob, acme):
+        kg.add_entity(e)
+    kg.add_relationship(
+        Relationship(
+            relationship_id="r1",
+            relationship_type="knows",
+            source_entity=alice,
+            target_entity=bob,
+        )
+    )
+    kg.add_relationship(
+        Relationship(
+            relationship_id="r2",
+            relationship_type="works_at",
+            source_entity=alice,
+            target_entity=acme,
+        )
+    )
+    return kg
+
+
+# ===========================================================================
+# 1. MCP tool: graph_gnn_embed
+# ===========================================================================
+class TestGraphGNNEmbedTool:
+    """Tests for the graph_gnn_embed MCP tool."""
+
+    def test_import(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_gnn_embed import (
+            graph_gnn_embed,
+        )
+        assert callable(graph_gnn_embed)
+
+    def test_returns_dict(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_gnn_embed import (
+            graph_gnn_embed,
+        )
+        r = asyncio.run(graph_gnn_embed())
+        assert isinstance(r, dict)
+
+    def test_has_status(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_gnn_embed import (
+            graph_gnn_embed,
+        )
+        r = asyncio.run(graph_gnn_embed())
+        assert "status" in r
+
+    def test_empty_graph_success(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_gnn_embed import (
+            graph_gnn_embed,
+        )
+        r = asyncio.run(graph_gnn_embed())
+        assert r["status"] == "success"
+        assert r["entity_count"] == 0
+        assert r["embeddings"] == {}
+
+    def test_with_kg_data(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_gnn_embed import (
+            graph_gnn_embed,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_gnn_embed(kg_data=kg.to_dict()))
+        assert r["status"] == "success"
+        assert r["entity_count"] == 3
+
+    def test_embeddings_keys_match_entity_ids(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_gnn_embed import (
+            graph_gnn_embed,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_gnn_embed(kg_data=kg.to_dict()))
+        assert set(r["embeddings"].keys()) == {"alice", "bob", "acme"}
+
+    def test_embeddings_are_float_lists(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_gnn_embed import (
+            graph_gnn_embed,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_gnn_embed(kg_data=kg.to_dict()))
+        for eid, vec in r["embeddings"].items():
+            assert isinstance(vec, list), f"{eid}: not a list"
+            assert all(isinstance(v, (int, float)) for v in vec), f"{eid}: non-numeric"
+
+    def test_top_k_similar(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_gnn_embed import (
+            graph_gnn_embed,
+        )
+        kg = _make_kg()
+        r = asyncio.run(
+            graph_gnn_embed(kg_data=kg.to_dict(), entity_ids=["alice"], top_k_similar=2)
+        )
+        assert "alice" in r["similar"]
+        assert isinstance(r["similar"]["alice"], list)
+
+    def test_layer_type_graph_conv(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_gnn_embed import (
+            graph_gnn_embed,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_gnn_embed(kg_data=kg.to_dict(), layer_type="graph_conv"))
+        assert r["status"] == "success"
+        assert r["layer_type"] == "graph_conv"
+
+    def test_layer_type_attention(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_gnn_embed import (
+            graph_gnn_embed,
+        )
+        kg = _make_kg()
+        r = asyncio.run(
+            graph_gnn_embed(kg_data=kg.to_dict(), layer_type="graph_attention")
+        )
+        assert r["status"] == "success"
+
+    def test_embedding_dim_in_result(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_gnn_embed import (
+            graph_gnn_embed,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_gnn_embed(kg_data=kg.to_dict(), embedding_dim=32))
+        assert r["embedding_dim"] == 32
+
+
+# ===========================================================================
+# 2. MCP tool: graph_zkp_prove
+# ===========================================================================
+class TestGraphZKPProveTool:
+    """Tests for the graph_zkp_prove MCP tool."""
+
+    def test_import(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        assert callable(graph_zkp_prove)
+
+    def test_entity_exists_default(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        r = asyncio.run(
+            graph_zkp_prove(
+                proof_type="entity_exists",
+                entity_type="person",
+                entity_name="Alice",
+            )
+        )
+        assert isinstance(r, dict)
+        assert r["status"] == "success"
+
+    def test_proof_type_in_result(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        r = asyncio.run(
+            graph_zkp_prove(
+                proof_type="entity_exists",
+                entity_type="person",
+                entity_name="Alice",
+            )
+        )
+        assert r["proof_type"] == "entity_exists"
+
+    def test_proof_is_dict(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        r = asyncio.run(
+            graph_zkp_prove(proof_type="entity_exists", entity_type="org", entity_name="ACME")
+        )
+        assert isinstance(r["proof"], dict)
+
+    def test_valid_is_bool(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        r = asyncio.run(
+            graph_zkp_prove(proof_type="entity_exists", entity_type="person", entity_name="Bob")
+        )
+        assert isinstance(r["valid"], bool)
+
+    def test_path_exists_proof(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        r = asyncio.run(
+            graph_zkp_prove(
+                proof_type="path_exists",
+                path_start_type="person",
+                path_end_type="org",
+            )
+        )
+        assert r["status"] == "success"
+        assert r["proof"] is not None
+
+    def test_query_count_proof(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        r = asyncio.run(
+            graph_zkp_prove(
+                proof_type="query_answer_count",
+                min_count=3,
+                actual_count=5,
+            )
+        )
+        assert r["status"] == "success"
+
+    def test_build_tdfol_witness_false(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        r = asyncio.run(
+            graph_zkp_prove(proof_type="entity_exists", entity_type="person", entity_name="X")
+        )
+        assert "tdfol_witness" not in r
+
+    def test_build_tdfol_witness_true(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        r = asyncio.run(
+            graph_zkp_prove(
+                proof_type="entity_exists",
+                entity_type="person",
+                entity_name="Alice",
+                entity_id="eid_001",
+                build_tdfol_witness=True,
+            )
+        )
+        assert r["status"] == "success"
+        assert "tdfol_witness" in r
+        assert isinstance(r["tdfol_witness"], dict)
+
+    def test_tdfol_witness_has_theorem(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        r = asyncio.run(
+            graph_zkp_prove(
+                proof_type="entity_exists",
+                entity_type="person",
+                entity_name="Alice",
+                entity_id="eid_001",
+                build_tdfol_witness=True,
+            )
+        )
+        assert "theorem" in r["tdfol_witness"]
+
+    def test_unknown_proof_type_returns_error(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        r = asyncio.run(graph_zkp_prove(proof_type="invalid_proof_type"))
+        assert r["status"] == "error"
+
+    def test_with_kg_data(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_zkp_prove import (
+            graph_zkp_prove,
+        )
+        kg = _make_kg()
+        r = asyncio.run(
+            graph_zkp_prove(
+                proof_type="entity_exists",
+                entity_type="person",
+                entity_name="alice",
+                kg_data=kg.to_dict(),
+            )
+        )
+        assert r["status"] == "success"
+
+
+# ===========================================================================
+# 3. MCP tool: graph_federate_query
+# ===========================================================================
+class TestGraphFederateQueryTool:
+    """Tests for the graph_federate_query MCP tool."""
+
+    def test_import(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_federate_query import (
+            graph_federate_query,
+        )
+        assert callable(graph_federate_query)
+
+    def test_empty_graphs_success(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_federate_query import (
+            graph_federate_query,
+        )
+        r = asyncio.run(graph_federate_query())
+        assert r["status"] == "success"
+        assert r["graph_count"] == 0
+
+    def test_with_two_graphs(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_federate_query import (
+            graph_federate_query,
+        )
+        kg1 = _make_kg("kg_a")
+        kg2 = _make_kg("kg_b")
+        r = asyncio.run(
+            graph_federate_query(graphs=[kg1.to_dict(), kg2.to_dict()])
+        )
+        assert r["status"] == "success"
+        assert r["graph_count"] == 2
+
+    def test_entity_matches_returned(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_federate_query import (
+            graph_federate_query,
+        )
+        kg1 = _make_kg("kg_a")
+        kg2 = _make_kg("kg_b")
+        r = asyncio.run(
+            graph_federate_query(graphs=[kg1.to_dict(), kg2.to_dict()])
+        )
+        assert "entity_matches" in r
+        assert isinstance(r["entity_matches"], list)
+
+    def test_query_entity_name(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_federate_query import (
+            graph_federate_query,
+        )
+        kg1 = _make_kg("kg_a")
+        kg2 = _make_kg("kg_b")
+        r = asyncio.run(
+            graph_federate_query(
+                graphs=[kg1.to_dict(), kg2.to_dict()],
+                query_entity_name="alice",
+            )
+        )
+        assert "query_hits" in r
+        assert len(r["query_hits"]) >= 1
+
+    def test_merge_mode(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_federate_query import (
+            graph_federate_query,
+        )
+        kg1 = _make_kg("kg_a")
+        kg2 = _make_kg("kg_b")
+        r = asyncio.run(
+            graph_federate_query(graphs=[kg1.to_dict(), kg2.to_dict()], merge=True)
+        )
+        assert r["status"] == "success"
+        assert "merged_entity_count" in r
+        assert "merged_relationship_count" in r
+
+    def test_resolution_strategy_exact_name(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_federate_query import (
+            graph_federate_query,
+        )
+        kg1 = _make_kg("kg_a")
+        r = asyncio.run(
+            graph_federate_query(
+                graphs=[kg1.to_dict()],
+                resolution_strategy="exact_name",
+            )
+        )
+        assert r["status"] == "success"
+        assert r["resolution_strategy"] == "exact_name"
+
+    def test_no_merge_no_merged_keys(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_federate_query import (
+            graph_federate_query,
+        )
+        kg1 = _make_kg("kg_a")
+        r = asyncio.run(graph_federate_query(graphs=[kg1.to_dict()], merge=False))
+        assert "merged_entity_count" not in r
+
+
+# ===========================================================================
+# 4. KnowledgeGraphManager — new methods
+# ===========================================================================
+class TestKnowledgeGraphManagerNewMethods:
+    """Tests for the 3 new KnowledgeGraphManager methods."""
+
+    def _manager(self):
+        from ipfs_datasets_py.core_operations.knowledge_graph_manager import (
+            KnowledgeGraphManager,
+        )
+        return KnowledgeGraphManager()
+
+    def test_gnn_embed_method_exists(self):
+        assert hasattr(self._manager(), "gnn_embed")
+
+    def test_zkp_prove_method_exists(self):
+        assert hasattr(self._manager(), "zkp_prove")
+
+    def test_federate_query_method_exists(self):
+        assert hasattr(self._manager(), "federate_query")
+
+    def test_gnn_embed_returns_dict(self):
+        mgr = self._manager()
+        r = asyncio.run(mgr.gnn_embed())
+        assert isinstance(r, dict)
+        assert "status" in r
+
+    def test_zkp_prove_returns_dict(self):
+        mgr = self._manager()
+        r = asyncio.run(mgr.zkp_prove(proof_type="entity_exists", entity_type="person", entity_name="Alice"))
+        assert isinstance(r, dict)
+        assert "status" in r
+
+    def test_federate_query_returns_dict(self):
+        mgr = self._manager()
+        r = asyncio.run(mgr.federate_query())
+        assert isinstance(r, dict)
+        assert "status" in r
+
+    def test_gnn_embed_with_kg(self):
+        mgr = self._manager()
+        kg = _make_kg()
+        r = asyncio.run(mgr.gnn_embed(kg_data=kg.to_dict()))
+        assert r["entity_count"] == 3
+
+    def test_zkp_prove_valid(self):
+        mgr = self._manager()
+        r = asyncio.run(
+            mgr.zkp_prove(
+                proof_type="entity_exists",
+                entity_type="person",
+                entity_name="Alice",
+            )
+        )
+        assert "valid" in r
+
+    def test_federate_query_with_kg(self):
+        mgr = self._manager()
+        kg = _make_kg()
+        r = asyncio.run(mgr.federate_query(graphs=[kg.to_dict()]))
+        assert r["graph_count"] == 1
+
+
+# ===========================================================================
+# 5. graph_tools __init__.py exports — 22 tools
+# ===========================================================================
+class TestGraphToolsExports:
+    """Tests for the updated graph_tools __init__.py."""
+
+    def test_three_new_tools_in_all(self):
+        # Import from the real package (relative imports work correctly)
+        import sys
+        import importlib
+        # Make sure the package is importable with PYTHONPATH set
+        _gt_path = str(_BASE)
+        if _gt_path not in sys.path:
+            sys.path.insert(0, _gt_path)
+        # Import __all__ from the actual module file
+        all_text = (_BASE / "ipfs_datasets_py" / "mcp_server" / "tools" / "graph_tools" / "__init__.py").read_text(encoding="utf-8")
+        for name in ("graph_gnn_embed", "graph_zkp_prove", "graph_federate_query"):
+            assert f'"{name}"' in all_text, f"{name!r} missing from __init__.py __all__"
+
+    def test_total_tools_count(self):
+        all_text = (_BASE / "ipfs_datasets_py" / "mcp_server" / "tools" / "graph_tools" / "__init__.py").read_text(encoding="utf-8")
+        # Count quoted names in __all__
+        import re
+        tool_names = re.findall(r'"(graph_\w+|query_knowledge_graph)"', all_text)
+        assert len(tool_names) >= 22, f"Expected >=22 tools, got {len(tool_names)}: {tool_names}"
+
+
+# ===========================================================================
+# 6. Documentation integrity
+# ===========================================================================
+class TestDocumentationIntegrity:
+    def test_master_status_has_v3_22_37(self):
+        content = _read(_MASTER)
+        assert "3.22.37" in content, "MASTER_STATUS.md should mention v3.22.37"
+
+    def test_roadmap_has_v3_22_37(self):
+        content = _read(_ROADMAP)
+        assert "3.22.37" in content, "ROADMAP.md should mention v3.22.37"
+
+    def test_changelog_has_session_83(self):
+        content = _read(_CHANGELOG)
+        assert "83" in content or "session83" in content.lower()
+
+    def test_readme_has_gnn_embed(self):
+        content = _read(_README_GT)
+        assert "graph_gnn_embed" in content
+
+    def test_readme_has_zkp_prove(self):
+        content = _read(_README_GT)
+        assert "graph_zkp_prove" in content
+
+    def test_readme_has_federate_query(self):
+        content = _read(_README_GT)
+        assert "graph_federate_query" in content

From 74c357d2c5629751f576d28e1fa8f07119eb98a0 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Mon, 23 Feb 2026 10:23:34 +0000
Subject: [PATCH 4/4] =?UTF-8?q?feat(knowledge=5Fgraphs):=20session=2084=20?=
 =?UTF-8?q?=E2=80=94=20graph=5Fanalytics=20+=20graph=5Flink=5Fpredict=20MC?=
 =?UTF-8?q?P=20tools=20(v3.22.38)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Co-authored-by: endomorphosis <3405202+endomorphosis@users.noreply.github.com>
---
 .../knowledge_graph_manager.py                | 219 ++++++++
 .../CHANGELOG_KNOWLEDGE_GRAPHS.md             |  27 +
 .../knowledge_graphs/DEFERRED_FEATURES.md     |  30 ++
 .../knowledge_graphs/IMPROVEMENT_TODO.md      |   1 +
 .../knowledge_graphs/MASTER_STATUS.md         |   6 +-
 ipfs_datasets_py/knowledge_graphs/ROADMAP.md  |   3 +-
 .../mcp_server/tools/graph_tools/README.md    |   2 +
 .../mcp_server/tools/graph_tools/__init__.py  |   4 +
 .../tools/graph_tools/graph_analytics.py      |  90 ++++
 .../tools/graph_tools/graph_link_predict.py   |  94 ++++
 .../test_master_status_session83.py           |   7 +-
 .../test_master_status_session84.py           | 470 ++++++++++++++++++
 12 files changed, 947 insertions(+), 6 deletions(-)
 create mode 100644 ipfs_datasets_py/mcp_server/tools/graph_tools/graph_analytics.py
 create mode 100644 ipfs_datasets_py/mcp_server/tools/graph_tools/graph_link_predict.py
 create mode 100644 tests/unit/knowledge_graphs/test_master_status_session84.py

diff --git a/ipfs_datasets_py/core_operations/knowledge_graph_manager.py b/ipfs_datasets_py/core_operations/knowledge_graph_manager.py
index a0b912473..9edb030d4 100644
--- a/ipfs_datasets_py/core_operations/knowledge_graph_manager.py
+++ b/ipfs_datasets_py/core_operations/knowledge_graph_manager.py
@@ -1387,3 +1387,222 @@ async def federate_query(
                 "entity_matches": [],
                 "query_hits": [],
             }
+
+    async def analytics(
+        self,
+        kg_data: Optional[Dict[str, Any]] = None,
+        include_completion_analysis: bool = True,
+        include_quality_metrics: bool = True,
+        include_topology: bool = True,
+        max_completion_suggestions: int = 20,
+    ) -> Dict[str, Any]:
+        """
+        Compute comprehensive analytics for a knowledge graph.
+
+        Args:
+            kg_data: Optional serialised KG dict.
+            include_completion_analysis: Run KG completion analysis.
+            include_quality_metrics: Compute quality metrics.
+            include_topology: Compute topology statistics.
+            max_completion_suggestions: Max missing-relationship suggestions.
+
+        Returns:
+            Dict with status, entity_count, relationship_count,
+            quality_metrics, missing_relationships, isolated_entities,
+            has_completion_suggestions, and topology.
+        """
+        try:
+            from ipfs_datasets_py.knowledge_graphs.extraction.graph import (
+                KnowledgeGraph,
+            )
+            from ipfs_datasets_py.knowledge_graphs.extraction.extractor import (
+                KnowledgeGraphExtractor,
+            )
+
+            if kg_data:
+                kg = KnowledgeGraph.from_dict(kg_data)
+            else:
+                kg = KnowledgeGraph("analytics_temp")
+
+            result: Dict[str, Any] = {
+                "status": "success",
+                "entity_count": len(kg.entities),
+                "relationship_count": len(kg.relationships),
+            }
+
+            if include_quality_metrics:
+                result["quality_metrics"] = KnowledgeGraphExtractor.compute_extraction_quality_metrics(kg)
+
+            if include_completion_analysis:
+                from ipfs_datasets_py.knowledge_graphs.query.completion import (
+                    KnowledgeGraphCompleter,
+                )
+                completer = KnowledgeGraphCompleter(kg)
+                suggestions = completer.find_missing_relationships(
+                    min_score=0.3,
+                    max_suggestions=max_completion_suggestions,
+                )
+                result["missing_relationships"] = [
+                    {
+                        "source_id": s.source_id,
+                        "target_id": s.target_id,
+                        "rel_type": s.rel_type,
+                        "score": s.score,
+                        "reason": s.reason.value,
+                    }
+                    for s in suggestions
+                ]
+                result["isolated_entities"] = completer.find_isolated_entities()
+                result["has_completion_suggestions"] = len(suggestions) > 0
+
+            if include_topology:
+                # Entity type distribution
+                etype_counts: Dict[str, int] = {}
+                for e in kg.entities.values():
+                    etype_counts[e.entity_type] = etype_counts.get(e.entity_type, 0) + 1
+
+                # Relationship type distribution
+                rtype_counts: Dict[str, int] = {}
+                for r in kg.relationships.values():
+                    rtype_counts[r.relationship_type] = rtype_counts.get(r.relationship_type, 0) + 1
+
+                # Degree statistics
+                out_degree: Dict[str, int] = {}
+                in_degree: Dict[str, int] = {}
+                for r in kg.relationships.values():
+                    out_degree[r.source_id] = out_degree.get(r.source_id, 0) + 1
+                    in_degree[r.target_id] = in_degree.get(r.target_id, 0) + 1
+
+                degrees = [
+                    out_degree.get(eid, 0) + in_degree.get(eid, 0)
+                    for eid in kg.entities
+                ]
+                total_degree = sum(degrees)
+                n = len(degrees)
+                avg_degree = total_degree / n if n else 0.0
+                min_degree = min(degrees) if degrees else 0
+                max_degree = max(degrees) if degrees else 0
+
+                result["topology"] = {
+                    "entity_type_distribution": etype_counts,
+                    "relationship_type_distribution": rtype_counts,
+                    "degree_stats": {
+                        "min": min_degree,
+                        "max": max_degree,
+                        "avg": avg_degree,
+                    },
+                    "source_only_entities": sum(
+                        1 for eid in kg.entities if in_degree.get(eid, 0) == 0
+                    ),
+                    "sink_only_entities": sum(
+                        1 for eid in kg.entities if out_degree.get(eid, 0) == 0
+                    ),
+                }
+
+            return result
+        except Exception as e:
+            self.logger.error("Analytics failed: %s", e)
+            return {
+                "status": "error",
+                "message": str(e),
+                "entity_count": 0,
+                "relationship_count": 0,
+            }
+
+    async def link_predict(
+        self,
+        entity_a_id: str,
+        entity_b_id: str,
+        kg_data: Optional[Dict[str, Any]] = None,
+        layer_type: str = "graph_sage",
+        embedding_dim: int = 64,
+        num_layers: int = 2,
+        top_candidates: Optional[List[str]] = None,
+        top_k: int = 5,
+    ) -> Dict[str, Any]:
+        """
+        Compute a GNN-based link-prediction score between two entities.
+
+        Args:
+            entity_a_id: ID of the first entity.
+            entity_b_id: ID of the second entity.
+            kg_data: Optional serialised KG dict.
+            layer_type: GNN message-passing layer type.
+            embedding_dim: Embedding dimensionality.
+            num_layers: Number of message-passing iterations.
+            top_candidates: Optional entity IDs to rank against entity_a_id.
+            top_k: Max ranked predictions to return.
+
+        Returns:
+            Dict with status, entity_a_id, entity_b_id, score, prediction,
+            layer_type, embedding_dim, and optionally top_predictions.
+        """
+        try:
+            from ipfs_datasets_py.knowledge_graphs.extraction.graph import (
+                KnowledgeGraph,
+            )
+            from ipfs_datasets_py.knowledge_graphs.query.gnn import (
+                GraphNeuralNetworkAdapter,
+                GNNConfig,
+                GNNLayerType,
+            )
+
+            if kg_data:
+                kg = KnowledgeGraph.from_dict(kg_data)
+            else:
+                kg = KnowledgeGraph("link_predict_temp")
+
+            try:
+                layer = GNNLayerType(layer_type)
+            except ValueError:
+                layer = GNNLayerType.GRAPH_SAGE
+
+            config = GNNConfig(
+                embedding_dim=embedding_dim,
+                num_layers=num_layers,
+                layer_type=layer,
+            )
+            adapter = GraphNeuralNetworkAdapter(kg, config)
+            score = adapter.link_prediction_score(entity_a_id, entity_b_id)
+            prediction = "likely" if score >= 0.5 else "unlikely"
+
+            result: Dict[str, Any] = {
+                "status": "success",
+                "entity_a_id": entity_a_id,
+                "entity_b_id": entity_b_id,
+                "score": score,
+                "prediction": prediction,
+                "layer_type": layer_type,
+                "embedding_dim": embedding_dim,
+            }
+
+            if top_candidates:
+                embeddings = adapter.compute_embeddings()
+                if entity_a_id in embeddings:
+                    from ipfs_datasets_py.knowledge_graphs.query.gnn import (
+                        _cosine_similarity,
+                    )
+                    query_vec = embeddings[entity_a_id].features
+                    ranked = []
+                    for cid in top_candidates:
+                        if cid in embeddings and cid != entity_a_id:
+                            s = _cosine_similarity(
+                                query_vec, embeddings[cid].features
+                            )
+                            ranked.append({"entity_id": cid, "score": s})
+                    ranked.sort(key=lambda x: x["score"], reverse=True)
+                    result["top_predictions"] = ranked[:top_k]
+                else:
+                    result["top_predictions"] = []
+
+            return result
+        except Exception as e:
+            self.logger.error("Link predict failed: %s", e)
+            return {
+                "status": "error",
+                "message": str(e),
+                "entity_a_id": entity_a_id,
+                "entity_b_id": entity_b_id,
+                "score": 0.0,
+                "prediction": "unknown",
+            }
diff --git a/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md b/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md
index 85ab4bb6b..e3fcab507 100644
--- a/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md
+++ b/ipfs_datasets_py/knowledge_graphs/CHANGELOG_KNOWLEDGE_GRAPHS.md
@@ -5,6 +5,33 @@ All notable changes to the knowledge_graphs module will be documented in this fi
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 
+## [3.22.38] - 2026-02-23
+
+### Added — 2 new MCP server tools for KG analytics and link prediction (Session 84) — 42 tests
+
+**`mcp_server/tools/graph_tools/graph_analytics.py`** (new MCP tool):
+- `graph_analytics(kg_data, include_completion_analysis, include_quality_metrics, include_topology, max_completion_suggestions)` — comprehensive KG analytics
+- Quality metrics via `KnowledgeGraphExtractor.compute_extraction_quality_metrics()`
+- KG completion via `KnowledgeGraphCompleter` (missing relationships, isolated entities)
+- Topology: entity/relationship type distributions + degree statistics
+- Returns `status / entity_count / relationship_count / quality_metrics / missing_relationships / isolated_entities / topology`
+
+**`mcp_server/tools/graph_tools/graph_link_predict.py`** (new MCP tool):
+- `graph_link_predict(entity_a_id, entity_b_id, kg_data, layer_type, top_candidates, top_k)` — GNN link prediction
+- Delegates to `GraphNeuralNetworkAdapter.link_prediction_score()`
+- Optional top-k ranked candidates via cosine similarity
+- Returns `status / score / prediction ("likely"/"unlikely") / top_predictions`
+
+**`core_operations/knowledge_graph_manager.py`** (updated):
+- Added `analytics()` — full analytics pipeline
+- Added `link_predict()` — link prediction with optional top-k ranking
+
+**`mcp_server/tools/graph_tools/__init__.py`** (updated):
+- 22 → 24 tools; `graph_analytics` and `graph_link_predict` added to `__all__`
+
+**`mcp_server/tools/graph_tools/README.md`** (updated):
+- 2 new rows for session 84 tools
+
 ## [3.22.37] - 2026-02-23
 
 ### Added — 3 new MCP server tools for GNN, ZKP, and Federation (Session 83) — 48 tests
diff --git a/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md b/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md
index 1ca78ff4a..a6ae62b5b 100644
--- a/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md
+++ b/ipfs_datasets_py/knowledge_graphs/DEFERRED_FEATURES.md
@@ -688,6 +688,36 @@ assert kg.list_snapshots() == ["before_merge"]
 
 ---
 
+## P15: Delivered in v3.22.38 (KG analytics and link prediction MCP tools)
+
+### 32. Graph Analytics MCP Tool
+
+**Status:** ✅ Implemented (v3.22.38 — 2026-02-23)
+**Location:** `mcp_server/tools/graph_tools/graph_analytics.py` + `core_operations/knowledge_graph_manager.KnowledgeGraphManager.analytics()`
+**Implementation:**
+- `graph_analytics(kg_data, include_completion_analysis, include_quality_metrics, include_topology, max_completion_suggestions)` — comprehensive analytics
+- Quality metrics via `KnowledgeGraphExtractor.compute_extraction_quality_metrics()`
+- KG completion analysis via `KnowledgeGraphCompleter.find_missing_relationships()` + `find_isolated_entities()`
+- Topology stats: entity/relationship type distributions, degree stats, source-only + sink-only counts
+
+**Tests:** `tests/unit/knowledge_graphs/test_master_status_session84.py`
+
+---
+
+### 33. Graph Link Prediction MCP Tool
+
+**Status:** ✅ Implemented (v3.22.38 — 2026-02-23)
+**Location:** `mcp_server/tools/graph_tools/graph_link_predict.py` + `core_operations/knowledge_graph_manager.KnowledgeGraphManager.link_predict()`
+**Implementation:**
+- `graph_link_predict(entity_a_id, entity_b_id, kg_data, layer_type, top_candidates, top_k)` — GNN link prediction
+- Delegates to `GraphNeuralNetworkAdapter.link_prediction_score()` (cosine similarity of node embeddings)
+- Optional top-k ranking: cosine similarity for each candidate vs. entity_a embedding
+- Returns `score ∈ [-1, 1]` + `prediction ("likely" ≥ 0.5, "unlikely" otherwise)` + `top_predictions`
+
+**Tests:** `tests/unit/knowledge_graphs/test_master_status_session84.py`
+
+---
+
 ## P14: Delivered in v3.22.37 (MCP tools for GNN, ZKP, and Federation)
 
 ### 29. GNN Embed MCP Tool
diff --git a/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md b/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md
index df6f08c8f..dbc35a2ae 100644
--- a/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md
+++ b/ipfs_datasets_py/knowledge_graphs/IMPROVEMENT_TODO.md
@@ -30,6 +30,7 @@
 
 ## Session log (most recent first)
 
+- **Session 84 (2026-02-23):** 2 new MCP server tools — `graph_analytics.py` (comprehensive KG analytics: quality metrics via `KnowledgeGraphExtractor.compute_extraction_quality_metrics()`; KG completion analysis via `KnowledgeGraphCompleter`; topology stats; `KnowledgeGraphManager.analytics()`) + `graph_link_predict.py` (GNN link-prediction score between two entities via `GraphNeuralNetworkAdapter.link_prediction_score()`; optional top-k ranking; `KnowledgeGraphManager.link_predict()`); graph_tools/__init__.py 22→24 tools; README.md updated; DEFERRED_FEATURES P15 §32-33; 42 tests. v3.22.37→v3.22.38.
 - **Session 83 (2026-02-23):** 3 new MCP server tools — `graph_gnn_embed.py` (compute GNN node embeddings via `GraphNeuralNetworkAdapter`; GRAPH_CONV/SAGE/ATTENTION; top-k similar entities; `KnowledgeGraphManager.gnn_embed()`) + `graph_zkp_prove.py` (generate ZK proofs for entity_exists/path_exists/entity_property/query_answer_count; optional TDFOL_v1 witness build via `KGWitnessBuilder`; `KnowledgeGraphManager.zkp_prove()`) + `graph_federate_query.py` (cross-graph entity resolution + entity lookup + merge via `FederatedKnowledgeGraph`; type_and_name/exact_name/property_match strategies; `KnowledgeGraphManager.federate_query()`); graph_tools/__init__.py 19→22 tools; README.md updated; DEFERRED_FEATURES P14 §29–31; 48 tests. v3.22.36→v3.22.37.
 - **Session 82 (2026-02-23):** TDFOL_v1 witness builder — `query/groth16_kg_witness.py` (`KGAtomEncoder`: normalize KG strings to valid single-word TDFOL_v1 atoms via `normalize()`/`encode_entity_type()`/`encode_name()`/`encode_relationship_type()`/`encode_entity_id()`/`encode_property_key()`/`atom_for_entity()`/`atom_for_entity_exists()`/`atom_for_path_exists()`/`atom_for_entity_property()`; `KGWitnessBuilder`: build complete TDFOL_v1 witness input dicts for `entity_exists`/`path_exists`/`entity_property`/`query_answer_count` proofs; auto-computes `theorem_hash_hex`+`axioms_commitment_hex`; circuit v2 support); `KGEntityFormula.to_tdfol_atoms()` classmethod added to `groth16_bridge.py`; `query/__init__.py` + `__all__` updated; DEFERRED_FEATURES P13 §27+§28; 80 tests. v3.22.35→v3.22.36.
 - **Session 81 (2026-02-23):** 5 new MCP server tools exposing query/extraction features — `graph_graphql_query.py` (execute GraphQL query via `KnowledgeGraphQLExecutor`) + `graph_visualize.py` (DOT/Mermaid/D3 JSON/ASCII via `KnowledgeGraphVisualizer`) + `graph_complete_suggestions.py` (missing-relationship suggestions via `KnowledgeGraphCompleter`) + `graph_explain.py` (explainable-AI entity/relationship/path/why_connected via `QueryExplainer`) + `graph_provenance_verify.py` (tamper-detection via `ProvenanceChain.verify_chain()`); 5 new `KnowledgeGraphManager` async methods; `graph_tools/__init__.py` + `README.md` updated (11→19 tools); 42 tests. v3.22.34→v3.22.35.
diff --git a/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md b/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md
index 91ae3f004..e2ff67db1 100644
--- a/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md
+++ b/ipfs_datasets_py/knowledge_graphs/MASTER_STATUS.md
@@ -1,9 +1,9 @@
 # Knowledge Graphs Module - Master Status Document
 
-**Version:** 3.22.37  
+**Version:** 3.22.38  
 **Status:** ✅ Production Ready  
-**Last Updated:** 2026-02-23 (session 83)  
-**Last Major Release:** v3.22.37 (session 83: 3 new MCP server tools — `graph_gnn_embed` / `graph_zkp_prove` / `graph_federate_query`; 3 new `KnowledgeGraphManager` methods; `graph_tools/__init__.py` updated 19→22 tools; `README.md` updated; 48 tests)
+**Last Updated:** 2026-02-23 (session 84)  
+**Last Major Release:** v3.22.38 (session 84: 2 new MCP server tools — `graph_analytics` / `graph_link_predict`; 2 new `KnowledgeGraphManager` methods; `graph_tools/__init__.py` updated 22→24 tools; `README.md` updated; 42 tests)
 
 ---
 
diff --git a/ipfs_datasets_py/knowledge_graphs/ROADMAP.md b/ipfs_datasets_py/knowledge_graphs/ROADMAP.md
index 272b64968..1099c59da 100644
--- a/ipfs_datasets_py/knowledge_graphs/ROADMAP.md
+++ b/ipfs_datasets_py/knowledge_graphs/ROADMAP.md
@@ -1,7 +1,7 @@
 # Knowledge Graphs - Development Roadmap
 
 **Last Updated:** 2026-02-23  
-**Current Version:** 3.22.37  
+**Current Version:** 3.22.38  
 **Status:** Production Ready (99.99% test coverage)
 
 ---
@@ -440,6 +440,7 @@ We follow [Semantic Versioning](https://semver.org/):
 | 3.22.35 | 2026-02-23 | ✅ Released | 5 new MCP tools for query/extraction features (graph_graphql_query, graph_visualize, graph_complete_suggestions, graph_explain, graph_provenance_verify); 5 new KnowledgeGraphManager methods; graph_tools/__init__.py+README.md updated; 42 tests (session81) |
 | 3.22.36 | 2026-02-23 | ✅ Released | TDFOL_v1 witness builder: `query/groth16_kg_witness.py` (`KGAtomEncoder` normalizes KG strings to valid single-word TDFOL_v1 atoms; `KGWitnessBuilder` builds complete witness input dicts for entity_exists/path_exists/entity_property/query_answer_count proofs compatible with Groth16 Rust backend); `KGEntityFormula.to_tdfol_atoms()` classmethod added; `query/__init__.py` exports updated; 50 tests (session82) |
 | 3.22.37 | 2026-02-23 | ✅ Released | 3 new MCP server tools: `graph_gnn_embed.py` (compute GNN node embeddings via `GraphNeuralNetworkAdapter`; layer types GRAPH_CONV/SAGE/ATTENTION; top-k similar entities; embedding vectors per entity) + `graph_zkp_prove.py` (generate ZK proofs for entity_exists/path_exists/entity_property/query_answer_count; optional TDFOL_v1 witness build) + `graph_federate_query.py` (query across federated KGs via `FederatedKnowledgeGraph`; entity resolution type_and_name/exact_name/property_match; merge mode; entity lookup); 3 new `KnowledgeGraphManager` methods; graph_tools/__init__.py 19→22 tools; README.md updated; 48 tests (session83) |
+| 3.22.38 | 2026-02-23 | ✅ Released | 2 new MCP server tools: `graph_analytics.py` (comprehensive KG analytics: quality metrics, KG completion analysis, topology stats; delegates to `KnowledgeGraphExtractor.compute_extraction_quality_metrics` + `KnowledgeGraphCompleter`; `KnowledgeGraphManager.analytics()`) + `graph_link_predict.py` (GNN link-prediction score between two entities via `GraphNeuralNetworkAdapter.link_prediction_score`; top-k ranked candidates; `KnowledgeGraphManager.link_predict()`); graph_tools/__init__.py 22→24 tools; README.md updated; 42 tests (session84) |
 | 3.22.34 | 2026-02-23 | ✅ Released | ROADMAP Research Areas: Knowledge Graph Completion (query/completion.py: KnowledgeGraphCompleter; 6 structural patterns: triadic closure/common neighbour/symmetric/transitive/inverse/type-compat; CompletionSuggestion+CompletionReason) + Explainable AI (query/explanation.py: QueryExplainer; explain_entity/relationship/path/why_connected/entity_importance_score; SURFACE/STANDARD/DEEP depth; EntityExplanation/RelationshipExplanation/PathExplanation); DEFERRED_FEATURES P12 §25+§26; 52 tests (session80) |
 | 3.22.33 | 2026-02-23 | ✅ Released | Comprehensive documentation update: query/README.md v2.1.0→v3.22.33 (5 new module sections + Advanced Query Features + Recent Additions table); docs/knowledge_graphs/API_REFERENCE.md v3.22.22→v3.22.33 (Advanced Extraction APIs + Advanced Query APIs sections with examples); docs/knowledge_graphs/USER_GUIDE.md v2.0.0→v3.22.33 (§11 Future Roadmap→Delivered Features table with 15 items all ✅); 46 doc tests (session79) |
 | 3.22.32 | 2026-02-23 | ✅ Released | Groth16 Bridge: query/groth16_bridge.py (groth16_binary_available+groth16_enabled+Groth16KGConfig+KGEntityFormula+create_groth16_kg_prover+create_groth16_kg_verifier+describe_groth16_status); direct KG↔TDFOL_v1 theorem/axiom mapping; binary availability probe; 7 query/__init__.py exports; DEFERRED_FEATURES §24 Direct Groth16 Bridge subsection; 50 tests (session78) |
diff --git a/ipfs_datasets_py/mcp_server/tools/graph_tools/README.md b/ipfs_datasets_py/mcp_server/tools/graph_tools/README.md
index a5d1fc3e0..acf53390d 100644
--- a/ipfs_datasets_py/mcp_server/tools/graph_tools/README.md
+++ b/ipfs_datasets_py/mcp_server/tools/graph_tools/README.md
@@ -30,6 +30,8 @@ The underlying graph engine supports Neo4j, in-memory, and IPLD-backed backends.
 | `graph_gnn_embed.py` | `graph_gnn_embed()` | Compute GNN node embeddings (GRAPH_CONV / SAGE / ATTENTION) *(new v3.22.37)* |
 | `graph_zkp_prove.py` | `graph_zkp_prove()` | Generate zero-knowledge proofs for KG assertions *(new v3.22.37)* |
 | `graph_federate_query.py` | `graph_federate_query()` | Query across federated knowledge graphs *(new v3.22.37)* |
+| `graph_analytics.py` | `graph_analytics()` | Comprehensive KG analytics: quality metrics, completion, topology *(new v3.22.38)* |
+| `graph_link_predict.py` | `graph_link_predict()` | GNN link-prediction score between two entities *(new v3.22.38)* |
 
 ## Usage
 
diff --git a/ipfs_datasets_py/mcp_server/tools/graph_tools/__init__.py b/ipfs_datasets_py/mcp_server/tools/graph_tools/__init__.py
index a707daf2d..59f32c640 100644
--- a/ipfs_datasets_py/mcp_server/tools/graph_tools/__init__.py
+++ b/ipfs_datasets_py/mcp_server/tools/graph_tools/__init__.py
@@ -27,6 +27,8 @@
 from .graph_gnn_embed import graph_gnn_embed
 from .graph_zkp_prove import graph_zkp_prove
 from .graph_federate_query import graph_federate_query
+from .graph_analytics import graph_analytics
+from .graph_link_predict import graph_link_predict
 
 __all__ = [
     "query_knowledge_graph",
@@ -51,4 +53,6 @@
     "graph_gnn_embed",
     "graph_zkp_prove",
     "graph_federate_query",
+    "graph_analytics",
+    "graph_link_predict",
 ]
diff --git a/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_analytics.py b/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_analytics.py
new file mode 100644
index 000000000..451b48d69
--- /dev/null
+++ b/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_analytics.py
@@ -0,0 +1,90 @@
+"""
+MCP tool for comprehensive knowledge-graph analytics.
+
+Thin wrapper around KnowledgeGraphManager.analytics().
+Core implementation: ipfs_datasets_py.core_operations.knowledge_graph_manager
+"""
+
+import logging
+from typing import Any, Dict, Optional
+
+logger = logging.getLogger(__name__)
+
+from ipfs_datasets_py.core_operations import KnowledgeGraphManager
+
+
+async def graph_analytics(
+    kg_data: Optional[Dict[str, Any]] = None,
+    include_completion_analysis: bool = True,
+    include_quality_metrics: bool = True,
+    include_topology: bool = True,
+    max_completion_suggestions: int = 20,
+) -> Dict[str, Any]:
+    """
+    Compute comprehensive analytics for a knowledge graph.
+
+    Aggregates multiple analysis passes into a single report:
+
+    **Quality metrics** (from :func:`~extraction.extractor.KnowledgeGraphExtractor.compute_extraction_quality_metrics`):
+    entity count, relationship count, relationship density, average
+    entity/relationship confidence, confidence std-dev, low-confidence ratio,
+    entity-type diversity, relationship-type diversity, isolated-entity ratio.
+
+    **KG completion analysis** (from :class:`~query.completion.KnowledgeGraphCompleter`):
+    top missing-relationship suggestions (sorted by score), isolated entity IDs,
+    and a graph-level completeness indicator.
+
+    **Topology** (pure graph computation):
+    entity-type distribution, relationship-type distribution, degree statistics
+    (min/max/avg), number of entities with in-degree=0, number with out-degree=0.
+
+    Args:
+        kg_data: Optional serialised knowledge-graph dict (from ``kg.to_dict()``).
+            When ``None`` an empty in-memory graph is used.
+        include_completion_analysis: When ``True`` (default), run KG completion
+            pattern analysis and return ``missing_relationships`` +
+            ``isolated_entities`` + ``has_completion_suggestions``.
+        include_quality_metrics: When ``True`` (default), compute and return
+            ``quality_metrics`` (confidence, density, diversity, etc.).
+        include_topology: When ``True`` (default), compute and return
+            ``topology`` (degree stats, type distributions).
+        max_completion_suggestions: Maximum number of missing-relationship
+            suggestions to return.  Default 20.
+
+    Returns:
+        Dict containing:
+
+        - ``status``: ``"success"`` or ``"error"``
+        - ``entity_count``: total entities
+        - ``relationship_count``: total relationships
+        - ``quality_metrics``: quality-metrics dict (only when
+          *include_quality_metrics* is ``True``)
+        - ``missing_relationships``: list of ``{"source_id", "target_id",
+          "rel_type", "score", "reason"}`` dicts (only when
+          *include_completion_analysis* is ``True``)
+        - ``isolated_entities``: list of entity IDs with no relationships
+          (only when *include_completion_analysis* is ``True``)
+        - ``has_completion_suggestions``: ``True`` when the graph has at least
+          one missing-relationship suggestion
+        - ``topology``: topology dict with ``entity_type_distribution``,
+          ``relationship_type_distribution``, ``degree_stats``
+          (only when *include_topology* is ``True``)
+    """
+    try:
+        manager = KnowledgeGraphManager()
+        result = await manager.analytics(
+            kg_data=kg_data,
+            include_completion_analysis=include_completion_analysis,
+            include_quality_metrics=include_quality_metrics,
+            include_topology=include_topology,
+            max_completion_suggestions=max_completion_suggestions,
+        )
+        return result
+    except Exception as e:
+        logger.error("Error in graph_analytics MCP tool: %s", e)
+        return {
+            "status": "error",
+            "message": str(e),
+            "entity_count": 0,
+            "relationship_count": 0,
+        }
diff --git a/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_link_predict.py b/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_link_predict.py
new file mode 100644
index 000000000..d897147db
--- /dev/null
+++ b/ipfs_datasets_py/mcp_server/tools/graph_tools/graph_link_predict.py
@@ -0,0 +1,94 @@
+"""
+MCP tool for GNN-based link prediction between two knowledge-graph entities.
+
+Thin wrapper around KnowledgeGraphManager.link_predict().
+Core implementation: ipfs_datasets_py.core_operations.knowledge_graph_manager
+"""
+
+import logging
+from typing import Any, Dict, List, Optional
+
+logger = logging.getLogger(__name__)
+
+from ipfs_datasets_py.core_operations import KnowledgeGraphManager
+
+
+async def graph_link_predict(
+    entity_a_id: str,
+    entity_b_id: str,
+    kg_data: Optional[Dict[str, Any]] = None,
+    layer_type: str = "graph_sage",
+    embedding_dim: int = 64,
+    num_layers: int = 2,
+    top_candidates: Optional[List[str]] = None,
+    top_k: int = 5,
+) -> Dict[str, Any]:
+    """
+    Compute a GNN-based link-prediction score between two knowledge-graph entities.
+
+    Uses :class:`~query.gnn.GraphNeuralNetworkAdapter` to generate node embeddings
+    via graph message-passing, then measures the cosine similarity of the two
+    entity embedding vectors as a link-prediction score.
+
+    A score near **1.0** means the two entities are highly similar in graph
+    context (i.e. they connect to the same neighbours, share types, etc.) and
+    a link between them is strongly predicted.  A score near **0.0** means the
+    entities occupy very different graph neighbourhoods and a link is unlikely.
+
+    Optionally, instead of scoring a single pair you can request the top-*k*
+    predicted link partners for *entity_a_id* from a list of *top_candidates*.
+
+    Args:
+        entity_a_id: ID of the first entity.
+        entity_b_id: ID of the second entity (used for the pair score).
+        kg_data: Optional serialised knowledge-graph dict.  When ``None``,
+            an empty in-memory graph is used and the result will have
+            ``score=0.0``.
+        layer_type: GNN message-passing layer type; one of ``"graph_conv"``,
+            ``"graph_sage"`` *(default)*, ``"graph_attention"``.
+        embedding_dim: Embedding dimensionality (default 64).
+        num_layers: Number of message-passing iterations (default 2).
+        top_candidates: Optional list of entity IDs to rank against
+            *entity_a_id*.  When provided, the tool also returns
+            ``top_predictions`` — the top-*k* candidates sorted by
+            link-prediction score.
+        top_k: Maximum number of ranked predictions to return when
+            *top_candidates* is given (default 5).
+
+    Returns:
+        Dict containing:
+
+        - ``status``: ``"success"`` or ``"error"``
+        - ``entity_a_id``: first entity ID
+        - ``entity_b_id``: second entity ID
+        - ``score``: cosine-similarity link-prediction score ∈ [-1, 1]
+        - ``prediction``: ``"likely"`` when score ≥ 0.5, ``"unlikely"``
+          otherwise
+        - ``top_predictions``: list of ``{"entity_id": str, "score": float}``
+          (only when *top_candidates* supplied)
+        - ``layer_type``: the GNN layer type used
+        - ``embedding_dim``: the embedding dimension used
+    """
+    try:
+        manager = KnowledgeGraphManager()
+        result = await manager.link_predict(
+            entity_a_id=entity_a_id,
+            entity_b_id=entity_b_id,
+            kg_data=kg_data,
+            layer_type=layer_type,
+            embedding_dim=embedding_dim,
+            num_layers=num_layers,
+            top_candidates=top_candidates,
+            top_k=top_k,
+        )
+        return result
+    except Exception as e:
+        logger.error("Error in graph_link_predict MCP tool: %s", e)
+        return {
+            "status": "error",
+            "message": str(e),
+            "entity_a_id": entity_a_id,
+            "entity_b_id": entity_b_id,
+            "score": 0.0,
+            "prediction": "unknown",
+        }
diff --git a/tests/unit/knowledge_graphs/test_master_status_session83.py b/tests/unit/knowledge_graphs/test_master_status_session83.py
index 00a2ce6e7..6a5200096 100644
--- a/tests/unit/knowledge_graphs/test_master_status_session83.py
+++ b/tests/unit/knowledge_graphs/test_master_status_session83.py
@@ -513,8 +513,11 @@ def test_total_tools_count(self):
 # ===========================================================================
 class TestDocumentationIntegrity:
     def test_master_status_has_v3_22_37(self):
-        content = _read(_MASTER)
-        assert "3.22.37" in content, "MASTER_STATUS.md should mention v3.22.37"
+        # v3.22.37 may appear in CHANGELOG but MASTER_STATUS advances to 3.22.38+
+        ms_content = _read(_MASTER)
+        cl_content = _read(_CHANGELOG)
+        assert "3.22.37" in ms_content or "3.22.37" in cl_content, \
+            "3.22.37 should appear in MASTER_STATUS.md or CHANGELOG"
 
     def test_roadmap_has_v3_22_37(self):
         content = _read(_ROADMAP)
diff --git a/tests/unit/knowledge_graphs/test_master_status_session84.py b/tests/unit/knowledge_graphs/test_master_status_session84.py
new file mode 100644
index 000000000..8645452d0
--- /dev/null
+++ b/tests/unit/knowledge_graphs/test_master_status_session84.py
@@ -0,0 +1,470 @@
+"""
+Tests for Session 84: graph_analytics + graph_link_predict MCP tools (v3.22.38).
+
+Session 84 (v3.22.38):
+- graph_analytics.py  — comprehensive KG analytics (quality, completion, topology)
+- graph_link_predict.py — GNN link-prediction score between two entities
+- 2 new KnowledgeGraphManager methods: analytics / link_predict
+- graph_tools/__init__.py updated (22→24 tools), README.md updated
+"""
+
+from __future__ import annotations
+
+import asyncio
+import pathlib
+import sys
+import types
+
+import pytest
+
+# Stub anyio so graph_tools can be imported without it installed.
+if "anyio" not in sys.modules:
+    sys.modules["anyio"] = types.ModuleType("anyio")
+
+_BASE = pathlib.Path(__file__).parent.parent.parent.parent
+_KG_ROOT = _BASE / "ipfs_datasets_py" / "knowledge_graphs"
+_MASTER = _KG_ROOT / "MASTER_STATUS.md"
+_CHANGELOG = _KG_ROOT / "CHANGELOG_KNOWLEDGE_GRAPHS.md"
+_ROADMAP = _KG_ROOT / "ROADMAP.md"
+_README_GT = (
+    _BASE / "ipfs_datasets_py" / "mcp_server" / "tools" / "graph_tools" / "README.md"
+)
+
+
+def _read(path: pathlib.Path) -> str:
+    return path.read_text(encoding="utf-8")
+
+
+def _make_kg(name="session84_kg"):
+    """Build a 4-entity KG with 3 relationships."""
+    from ipfs_datasets_py.knowledge_graphs.extraction.graph import (
+        KnowledgeGraph,
+        Entity,
+        Relationship,
+    )
+
+    kg = KnowledgeGraph(name=name)
+    alice = Entity(entity_id="alice", entity_type="person", name="alice", confidence=0.9)
+    bob = Entity(entity_id="bob", entity_type="person", name="bob", confidence=0.8)
+    acme = Entity(entity_id="acme", entity_type="org", name="acme", confidence=1.0)
+    solo = Entity(entity_id="solo", entity_type="person", name="solo", confidence=0.7)
+
+    for e in (alice, bob, acme, solo):
+        kg.add_entity(e)
+
+    kg.add_relationship(
+        Relationship(
+            relationship_id="r1",
+            relationship_type="knows",
+            source_entity=alice,
+            target_entity=bob,
+        )
+    )
+    kg.add_relationship(
+        Relationship(
+            relationship_id="r2",
+            relationship_type="works_at",
+            source_entity=alice,
+            target_entity=acme,
+        )
+    )
+    kg.add_relationship(
+        Relationship(
+            relationship_id="r3",
+            relationship_type="works_at",
+            source_entity=bob,
+            target_entity=acme,
+        )
+    )
+    return kg
+
+
+# ===========================================================================
+# 1. graph_analytics MCP tool
+# ===========================================================================
+class TestGraphAnalyticsTool:
+    """Tests for the graph_analytics MCP tool."""
+
+    def test_import(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        assert callable(graph_analytics)
+
+    def test_empty_graph_success(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        r = asyncio.run(graph_analytics())
+        assert isinstance(r, dict)
+        assert r["status"] == "success"
+
+    def test_entity_count(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_analytics(kg_data=kg.to_dict()))
+        assert r["entity_count"] == 4
+
+    def test_relationship_count(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_analytics(kg_data=kg.to_dict()))
+        assert r["relationship_count"] == 3
+
+    def test_quality_metrics_present(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_analytics(kg_data=kg.to_dict(), include_quality_metrics=True))
+        assert "quality_metrics" in r
+        assert isinstance(r["quality_metrics"], dict)
+
+    def test_quality_metrics_keys(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_analytics(kg_data=kg.to_dict()))
+        qm = r["quality_metrics"]
+        for key in ("entity_count", "relationship_count", "relationship_density",
+                    "avg_entity_confidence", "avg_relationship_confidence"):
+            assert key in qm, f"{key!r} missing from quality_metrics"
+
+    def test_completion_analysis_present(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        kg = _make_kg()
+        r = asyncio.run(
+            graph_analytics(kg_data=kg.to_dict(), include_completion_analysis=True)
+        )
+        assert "missing_relationships" in r
+        assert "isolated_entities" in r
+        assert "has_completion_suggestions" in r
+
+    def test_isolated_entities_found(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_analytics(kg_data=kg.to_dict()))
+        # "solo" has no relationships
+        assert "solo" in r["isolated_entities"]
+
+    def test_topology_present(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_analytics(kg_data=kg.to_dict(), include_topology=True))
+        assert "topology" in r
+        topo = r["topology"]
+        assert "entity_type_distribution" in topo
+        assert "relationship_type_distribution" in topo
+        assert "degree_stats" in topo
+
+    def test_topology_entity_types(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_analytics(kg_data=kg.to_dict()))
+        topo = r["topology"]
+        # 3 persons + 1 org
+        assert topo["entity_type_distribution"].get("person", 0) == 3
+        assert topo["entity_type_distribution"].get("org", 0) == 1
+
+    def test_topology_degree_stats_keys(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_analytics(kg_data=kg.to_dict()))
+        ds = r["topology"]["degree_stats"]
+        for k in ("min", "max", "avg"):
+            assert k in ds, f"{k!r} missing from degree_stats"
+
+    def test_no_quality_metrics_when_disabled(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        r = asyncio.run(graph_analytics(include_quality_metrics=False))
+        assert "quality_metrics" not in r
+
+    def test_no_completion_when_disabled(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        r = asyncio.run(graph_analytics(include_completion_analysis=False))
+        assert "missing_relationships" not in r
+
+    def test_no_topology_when_disabled(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        r = asyncio.run(graph_analytics(include_topology=False))
+        assert "topology" not in r
+
+    def test_missing_relationships_list(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_analytics(kg_data=kg.to_dict()))
+        assert isinstance(r["missing_relationships"], list)
+
+    def test_max_completion_suggestions_respected(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_analytics import (
+            graph_analytics,
+        )
+        kg = _make_kg()
+        r = asyncio.run(
+            graph_analytics(kg_data=kg.to_dict(), max_completion_suggestions=2)
+        )
+        assert len(r["missing_relationships"]) <= 2
+
+
+# ===========================================================================
+# 2. graph_link_predict MCP tool
+# ===========================================================================
+class TestGraphLinkPredictTool:
+    """Tests for the graph_link_predict MCP tool."""
+
+    def test_import(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        assert callable(graph_link_predict)
+
+    def test_returns_dict(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        r = asyncio.run(graph_link_predict("alice", "bob"))
+        assert isinstance(r, dict)
+
+    def test_has_status(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_link_predict("alice", "bob", kg_data=kg.to_dict()))
+        assert r["status"] == "success"
+
+    def test_entity_ids_in_result(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_link_predict("alice", "bob", kg_data=kg.to_dict()))
+        assert r["entity_a_id"] == "alice"
+        assert r["entity_b_id"] == "bob"
+
+    def test_score_is_float(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_link_predict("alice", "bob", kg_data=kg.to_dict()))
+        assert isinstance(r["score"], float)
+
+    def test_prediction_field(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_link_predict("alice", "bob", kg_data=kg.to_dict()))
+        assert r["prediction"] in ("likely", "unlikely")
+
+    def test_missing_entity_score_zero(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        kg = _make_kg()
+        r = asyncio.run(
+            graph_link_predict("alice", "nonexistent_entity", kg_data=kg.to_dict())
+        )
+        assert r["score"] == 0.0
+
+    def test_layer_type_returned(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        kg = _make_kg()
+        r = asyncio.run(
+            graph_link_predict("alice", "bob", kg_data=kg.to_dict(), layer_type="graph_conv")
+        )
+        assert r["layer_type"] == "graph_conv"
+
+    def test_embedding_dim_returned(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        kg = _make_kg()
+        r = asyncio.run(
+            graph_link_predict("alice", "bob", kg_data=kg.to_dict(), embedding_dim=32)
+        )
+        assert r["embedding_dim"] == 32
+
+    def test_num_layers_accepted(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        kg = _make_kg()
+        r = asyncio.run(
+            graph_link_predict("alice", "bob", kg_data=kg.to_dict(), num_layers=3)
+        )
+        assert r["status"] == "success"
+        assert isinstance(r["score"], float)
+
+    def test_top_candidates_returns_list(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        kg = _make_kg()
+        r = asyncio.run(
+            graph_link_predict(
+                "alice",
+                "bob",
+                kg_data=kg.to_dict(),
+                top_candidates=["bob", "acme", "solo"],
+                top_k=3,
+            )
+        )
+        assert "top_predictions" in r
+        assert isinstance(r["top_predictions"], list)
+        assert len(r["top_predictions"]) <= 3
+
+    def test_top_predictions_have_score(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        kg = _make_kg()
+        r = asyncio.run(
+            graph_link_predict(
+                "alice",
+                "bob",
+                kg_data=kg.to_dict(),
+                top_candidates=["bob", "acme", "solo"],
+            )
+        )
+        for pred in r["top_predictions"]:
+            assert "entity_id" in pred
+            assert "score" in pred
+            assert isinstance(pred["score"], float)
+
+    def test_no_top_candidates_no_top_predictions(self):
+        from ipfs_datasets_py.mcp_server.tools.graph_tools.graph_link_predict import (
+            graph_link_predict,
+        )
+        kg = _make_kg()
+        r = asyncio.run(graph_link_predict("alice", "bob", kg_data=kg.to_dict()))
+        assert "top_predictions" not in r
+
+
+# ===========================================================================
+# 3. KnowledgeGraphManager new methods
+# ===========================================================================
+class TestKnowledgeGraphManagerSession84:
+    """Tests for analytics / link_predict KnowledgeGraphManager methods."""
+
+    def _manager(self):
+        from ipfs_datasets_py.core_operations.knowledge_graph_manager import (
+            KnowledgeGraphManager,
+        )
+        return KnowledgeGraphManager()
+
+    def test_analytics_method_exists(self):
+        assert hasattr(self._manager(), "analytics")
+
+    def test_link_predict_method_exists(self):
+        assert hasattr(self._manager(), "link_predict")
+
+    def test_analytics_returns_dict(self):
+        r = asyncio.run(self._manager().analytics())
+        assert isinstance(r, dict)
+        assert "status" in r
+
+    def test_link_predict_returns_dict(self):
+        r = asyncio.run(self._manager().link_predict("a", "b"))
+        assert isinstance(r, dict)
+        assert "status" in r
+
+    def test_analytics_with_kg(self):
+        kg = _make_kg()
+        r = asyncio.run(self._manager().analytics(kg_data=kg.to_dict()))
+        assert r["entity_count"] == 4
+        assert r["relationship_count"] == 3
+
+    def test_link_predict_with_kg(self):
+        kg = _make_kg()
+        r = asyncio.run(
+            self._manager().link_predict("alice", "bob", kg_data=kg.to_dict())
+        )
+        assert r["status"] == "success"
+        assert "score" in r
+
+    def test_analytics_quality_metrics_has_avg_confidence(self):
+        kg = _make_kg()
+        r = asyncio.run(self._manager().analytics(kg_data=kg.to_dict()))
+        qm = r["quality_metrics"]
+        assert "avg_entity_confidence" in qm
+        assert 0.0 <= qm["avg_entity_confidence"] <= 1.0
+
+
+# ===========================================================================
+# 4. graph_tools __init__.py exports — 24 tools
+# ===========================================================================
+class TestGraphToolsExports84:
+    """Tests for the updated graph_tools __init__.py (22→24 tools)."""
+
+    def test_new_tools_in_init(self):
+        init_text = (
+            _BASE
+            / "ipfs_datasets_py"
+            / "mcp_server"
+            / "tools"
+            / "graph_tools"
+            / "__init__.py"
+        ).read_text(encoding="utf-8")
+        for name in ("graph_analytics", "graph_link_predict"):
+            assert f'"{name}"' in init_text, f"{name!r} missing from __init__.py"
+
+    def test_total_tools_at_least_24(self):
+        import re
+        init_text = (
+            _BASE
+            / "ipfs_datasets_py"
+            / "mcp_server"
+            / "tools"
+            / "graph_tools"
+            / "__init__.py"
+        ).read_text(encoding="utf-8")
+        tool_names = re.findall(r'"(graph_\w+|query_knowledge_graph)"', init_text)
+        assert len(tool_names) >= 24, f"Expected >=24 tools, got {len(tool_names)}"
+
+
+# ===========================================================================
+# 5. Documentation integrity
+# ===========================================================================
+class TestDocumentationIntegrity84:
+    def test_master_status_has_v3_22_38(self):
+        assert "3.22.38" in _read(_MASTER), "MASTER_STATUS.md should mention v3.22.38"
+
+    def test_roadmap_has_v3_22_38(self):
+        assert "3.22.38" in _read(_ROADMAP), "ROADMAP.md should mention v3.22.38"
+
+    def test_changelog_has_session_84(self):
+        content = _read(_CHANGELOG)
+        assert "3.22.38" in content or "session84" in content.lower() or "Session 84" in content
+
+    def test_readme_has_graph_analytics(self):
+        assert "graph_analytics" in _read(_README_GT)
+
+    def test_readme_has_graph_link_predict(self):
+        assert "graph_link_predict" in _read(_README_GT)