Made knowledge graphs first-class parts of domain packs.

This commit is contained in:
welsberr 2026-03-16 17:46:33 -04:00
parent 51dd2b29ff
commit 41ca57d60f
16 changed files with 6294 additions and 5 deletions

View File

@ -51,11 +51,17 @@ The pack emitter writes:
- `conflict_report.md` - `conflict_report.md`
- `license_attribution.json` - `license_attribution.json`
- `source_corpus.json` - `source_corpus.json`
- `knowledge_graph.json`
`source_corpus.json` is the main grounded-text artifact. It preserves lesson bodies, objectives, `source_corpus.json` is the main grounded-text artifact. It preserves lesson bodies, objectives,
exercises, and source references from the ingested material so downstream tutoring or evaluation exercises, and source references from the ingested material so downstream tutoring or evaluation
can rely on source-derived text instead of only the distilled concept graph. can rely on source-derived text instead of only the distilled concept graph.
`knowledge_graph.json` is the graph-first artifact. It preserves typed nodes and justified edges
for sources, modules, lessons, concepts, assessment signals, and prerequisite/support relations.
Later Didactopus retrieval and tutoring flows can use this graph to explain why a concept appears,
what supports it, and which source material grounds it.
## Rule layer ## Rule layer
The current default rules: The current default rules:

File diff suppressed because it is too large Load Diff

View File

@ -14,3 +14,4 @@ profile_templates: {}
cross_pack_links: [] cross_pack_links: []
supporting_artifacts: supporting_artifacts:
- source_corpus.json - source_corpus.json
- knowledge_graph.json

File diff suppressed because it is too large Load Diff

View File

@ -14,3 +14,4 @@ profile_templates: {}
cross_pack_links: [] cross_pack_links: []
supporting_artifacts: supporting_artifacts:
- source_corpus.json - source_corpus.json
- knowledge_graph.json

View File

@ -11,6 +11,12 @@
], ],
"concept_count": 34, "concept_count": 34,
"source_fragment_count": 60, "source_fragment_count": 60,
"knowledge_graph_summary": {
"node_count": 98,
"edge_count": 178,
"concept_count": 34,
"source_count": 3
},
"target_concept": "mit-ocw-information-and-entropy::thermodynamics-and-entropy", "target_concept": "mit-ocw-information-and-entropy::thermodynamics-and-entropy",
"curriculum_path": [ "curriculum_path": [
"mit-ocw-information-and-entropy::mit-ocw-6-050j-information-and-entropy-course-home", "mit-ocw-information-and-entropy::mit-ocw-6-050j-information-and-entropy-course-home",

View File

@ -0,0 +1,91 @@
from __future__ import annotations
from dataclasses import dataclass
@dataclass
class GraphBundle:
    """Paired graph-first pack artifacts used by the retrieval helpers.

    Bundles the parsed ``knowledge_graph.json`` payload with the parsed
    ``source_corpus.json`` payload so helpers can cross-reference graph
    nodes/edges with grounded source fragments.
    """

    # Parsed knowledge_graph.json; helpers read its "nodes" and "edges" lists.
    knowledge_graph: dict
    # Parsed source_corpus.json; helpers read its "fragments" list.
    source_corpus: dict
def concept_node_id(concept_id: str) -> str:
    """Return the knowledge-graph node id for a concept id."""
    return "concept::" + concept_id
def _node_index(bundle: GraphBundle) -> dict[str, dict]:
return {node["id"]: node for node in bundle.knowledge_graph.get("nodes", [])}
def _edges(bundle: GraphBundle) -> list[dict]:
return list(bundle.knowledge_graph.get("edges", []))
def get_concept_node(bundle: GraphBundle, concept_id: str) -> dict | None:
    """Look up the node for *concept_id* in the graph, or None if absent."""
    node_id = concept_node_id(concept_id)
    return _node_index(bundle).get(node_id)
def concept_neighborhood(bundle: GraphBundle, concept_id: str) -> dict:
    """Collect a concept's node, its incident edges, and its neighbor nodes.

    Returns a dict with keys: "concept" (the concept node or {}), "incoming"
    and "outgoing" (edge lists touching the concept), plus "incoming_nodes"
    and "outgoing_nodes" (neighbor nodes that actually exist in the graph).
    """
    target_id = concept_node_id(concept_id)
    node_by_id = _node_index(bundle)
    all_edges = _edges(bundle)
    incoming = [edge for edge in all_edges if edge["target"] == target_id]
    outgoing = [edge for edge in all_edges if edge["source"] == target_id]
    # Neighbor-node lists only include nodes present in the graph, so they
    # can be shorter than the corresponding edge lists.
    incoming_nodes = [
        node_by_id[edge["source"]] for edge in incoming if edge["source"] in node_by_id
    ]
    outgoing_nodes = [
        node_by_id[edge["target"]] for edge in outgoing if edge["target"] in node_by_id
    ]
    return {
        "concept": node_by_id.get(target_id, {}),
        "incoming": incoming,
        "outgoing": outgoing,
        "incoming_nodes": incoming_nodes,
        "outgoing_nodes": outgoing_nodes,
    }
def source_fragments_for_concept(bundle: GraphBundle, concept_id: str, limit: int = 3) -> list[dict]:
    """Return up to *limit* corpus fragments from lessons linked to the concept.

    A fragment qualifies when its ``lesson_title`` matches the title of any
    lesson-typed node adjacent to the concept in the graph. Fragments are
    returned in corpus order.
    """
    neighborhood = concept_neighborhood(bundle, concept_id)
    lesson_titles: set[str] = set()
    for node in neighborhood["incoming_nodes"] + neighborhood["outgoing_nodes"]:
        if node.get("type") == "lesson":
            lesson_titles.add(node.get("title", ""))
    selected: list[dict] = []
    for fragment in bundle.source_corpus.get("fragments", []):
        if fragment.get("lesson_title") not in lesson_titles:
            continue
        selected.append(fragment)
        if len(selected) >= limit:
            break
    return selected
def prerequisite_titles(bundle: GraphBundle, concept_id: str) -> list[str]:
    """Return deduplicated titles of prerequisite concepts feeding *concept_id*.

    Fix: the previous implementation zipped ``incoming`` (all incoming edges)
    with ``incoming_nodes`` (only edges whose source node exists in the
    graph). As soon as one edge referenced a missing node, every later
    edge/node pair was misaligned. Here each edge is paired with its source
    node by id instead.
    """
    neighborhood = concept_neighborhood(bundle, concept_id)
    node_by_id = {node["id"]: node for node in neighborhood["incoming_nodes"]}
    titles: list[str] = []
    seen: set[str] = set()
    for edge in neighborhood["incoming"]:
        if edge.get("type") != "prerequisite":
            continue
        node = node_by_id.get(edge["source"])
        if node is None:
            # Edge references a node that is absent from the graph; skip it.
            continue
        title = node.get("title", node.get("id", ""))
        if title not in seen:
            seen.add(title)
            titles.append(title)
    return titles
def lesson_titles_for_concept(bundle: GraphBundle, concept_id: str) -> list[str]:
    """Return deduplicated titles of lessons that support or teach the concept.

    Fix: the previous implementation zipped ``incoming`` (all incoming edges)
    with ``incoming_nodes`` (only edges whose source node exists in the
    graph), which misaligned pairs whenever an edge referenced a missing
    node. Here each edge is paired with its source node by id instead.
    """
    neighborhood = concept_neighborhood(bundle, concept_id)
    node_by_id = {node["id"]: node for node in neighborhood["incoming_nodes"]}
    titles: list[str] = []
    seen: set[str] = set()
    for edge in neighborhood["incoming"]:
        if edge.get("type") not in {"supports_concept", "teaches_concept"}:
            continue
        node = node_by_id.get(edge["source"])
        if node is None or node.get("type") != "lesson":
            continue
        title = node.get("title", node.get("id", ""))
        if title not in seen:
            seen.add(title)
            titles.append(title)
    return titles

View File

@ -0,0 +1,219 @@
from __future__ import annotations
import json
import re
from pathlib import Path
from .course_schema import ConceptCandidate, NormalizedCourse
def _slugify(text: str) -> str:
cleaned = re.sub(r"[^a-zA-Z0-9]+", "-", text.strip().lower()).strip("-")
return cleaned or "untitled"
def _source_node_id(source_path: str) -> str:
    """Stable graph node id for an ingested source path."""
    return "source::" + _slugify(source_path)
def _module_node_id(module_title: str) -> str:
    """Stable graph node id for a module title."""
    return "module::" + _slugify(module_title)
def _lesson_node_id(module_title: str, lesson_title: str) -> str:
    """Stable graph node id for a lesson, namespaced by its module."""
    return "::".join(("lesson", _slugify(module_title), _slugify(lesson_title)))
def _concept_node_id(concept_id: str) -> str:
return f"concept::{concept_id}"
def _signal_node_id(kind: str, lesson_title: str, idx: int) -> str:
    """Stable graph node id for an assessment signal (objective/exercise)."""
    return "::".join((kind, _slugify(lesson_title), str(idx)))
def _add_node(nodes: dict[str, dict], node_id: str, node_type: str, **attrs) -> None:
node = nodes.setdefault(node_id, {"id": node_id, "type": node_type})
for key, value in attrs.items():
if value not in (None, "", [], {}):
node[key] = value
def _add_edge(edges: list[dict], source: str, target: str, edge_type: str, justification: str, provenance: list[str] | None = None, confidence: float = 1.0) -> None:
edges.append(
{
"source": source,
"target": target,
"type": edge_type,
"justification": justification,
"provenance": list(provenance or []),
"confidence": confidence,
}
)
def build_knowledge_graph(course: NormalizedCourse, concepts: list[ConceptCandidate]) -> dict:
    """Build the graph-first pack artifact from a normalized course.

    Emits typed nodes (source, concept, module, lesson, assessment_signal)
    and justified edges, plus a summary block with node/edge/concept/source
    counts. Node insertion order is: sources, concepts, then course
    structure — lesson->concept edges rely on concept nodes existing first.

    Fixes over the previous version: removes the unused ``concept_ids`` set
    and the unused ``lesson_sources`` list (which also performed a wasted
    full module/lesson scan per source lesson), and splits the monolithic
    body into focused helpers.
    """
    nodes: dict[str, dict] = {}
    edges: list[dict] = []
    _add_source_nodes(course, nodes)
    _add_concept_nodes(concepts, nodes)
    _add_structure(course, nodes, edges)
    _link_concepts(course, concepts, nodes, edges)
    return {
        "course_title": course.title,
        "rights_note": course.rights_note,
        "summary": {
            "node_count": len(nodes),
            "edge_count": len(edges),
            "concept_count": len(concepts),
            "source_count": len(course.source_records),
        },
        "nodes": list(nodes.values()),
        "edges": edges,
    }


def _add_source_nodes(course: NormalizedCourse, nodes: dict[str, dict]) -> None:
    """Register one typed node per ingested source record."""
    for source in course.source_records:
        _add_node(
            nodes,
            _source_node_id(source.source_path),
            "source",
            title=source.title or source.source_path,
            source_path=source.source_path,
            source_type=source.source_type,
            # Older source records may predate the metadata field.
            metadata=getattr(source, "metadata", {}),
        )


def _add_concept_nodes(concepts: list[ConceptCandidate], nodes: dict[str, dict]) -> None:
    """Register one typed node per distilled concept candidate."""
    for concept in concepts:
        _add_node(
            nodes,
            _concept_node_id(concept.id),
            "concept",
            title=concept.title,
            description=concept.description,
            source_modules=list(concept.source_modules),
            source_lessons=list(concept.source_lessons),
            source_courses=list(concept.source_courses),
            mastery_signals=list(concept.mastery_signals),
        )


def _add_structure(course: NormalizedCourse, nodes: dict[str, dict], edges: list[dict]) -> None:
    """Add module/lesson nodes and each lesson's subgraph of signals and links."""
    for module in course.modules:
        module_id = _module_node_id(module.title)
        _add_node(nodes, module_id, "module", title=module.title)
        for lesson in module.lessons:
            _add_lesson_subgraph(module.title, lesson, module_id, nodes, edges)


def _add_lesson_subgraph(module_title: str, lesson, module_id: str, nodes: dict[str, dict], edges: list[dict]) -> None:
    """Add one lesson node, its assessment signals, and its justified edges."""
    lesson_id = _lesson_node_id(module_title, lesson.title)
    _add_node(
        nodes,
        lesson_id,
        "lesson",
        title=lesson.title,
        module_title=module_title,
        body=lesson.body,
        source_refs=list(lesson.source_refs),
        key_terms=list(lesson.key_terms),
    )
    _add_edge(
        edges,
        module_id,
        lesson_id,
        "contains_lesson",
        justification=f"Lesson '{lesson.title}' appears under module '{module_title}'.",
        provenance=list(lesson.source_refs),
    )
    # Ground the lesson in each source it was ingested from (when known).
    for source_ref in lesson.source_refs:
        source_id = _source_node_id(source_ref)
        if source_id in nodes:
            _add_edge(
                edges,
                source_id,
                lesson_id,
                "derived_lesson",
                justification=f"Lesson '{lesson.title}' was ingested from source '{source_ref}'.",
                provenance=[source_ref],
            )
    for idx, objective in enumerate(lesson.objectives, start=1):
        objective_id = _signal_node_id("objective", lesson.title, idx)
        _add_node(nodes, objective_id, "assessment_signal", title=objective, signal_kind="objective")
        _add_edge(
            edges,
            lesson_id,
            objective_id,
            "has_objective",
            justification=f"Objective {idx} was extracted from lesson '{lesson.title}'.",
            provenance=list(lesson.source_refs),
        )
    for idx, exercise in enumerate(lesson.exercises, start=1):
        exercise_id = _signal_node_id("exercise", lesson.title, idx)
        _add_node(nodes, exercise_id, "assessment_signal", title=exercise, signal_kind="exercise")
        _add_edge(
            edges,
            lesson_id,
            exercise_id,
            "has_exercise",
            justification=f"Exercise {idx} was extracted from lesson '{lesson.title}'.",
            provenance=list(lesson.source_refs),
        )
    # A lesson whose slug matches a concept id directly teaches that concept.
    lesson_concept_id = _concept_node_id(_slugify(lesson.title))
    if lesson_concept_id in nodes:
        _add_edge(
            edges,
            lesson_id,
            lesson_concept_id,
            "teaches_concept",
            justification=f"Lesson '{lesson.title}' yields the lesson-level concept '{lesson.title}'.",
            provenance=list(lesson.source_refs),
        )
    # Key terms that slugify to a known concept are weaker "mentions" links.
    for term in lesson.key_terms:
        term_id = _concept_node_id(_slugify(term))
        if term_id in nodes:
            _add_edge(
                edges,
                lesson_id,
                term_id,
                "mentions_concept",
                justification=f"Key term '{term}' was extracted from lesson '{lesson.title}'.",
                provenance=list(lesson.source_refs),
                confidence=0.7,
            )


def _link_concepts(course: NormalizedCourse, concepts: list[ConceptCandidate], nodes: dict[str, dict], edges: list[dict]) -> None:
    """Add prerequisite and lesson-support edges between existing nodes."""
    for concept in concepts:
        concept_node = _concept_node_id(concept.id)
        for prereq in concept.prerequisites:
            prereq_id = _concept_node_id(prereq)
            # Only link prerequisites that survived concept distillation.
            if prereq_id in nodes:
                _add_edge(
                    edges,
                    prereq_id,
                    concept_node,
                    "prerequisite",
                    justification=f"Concept '{concept.title}' depends on prerequisite '{prereq}'.",
                    provenance=list(concept.source_courses),
                    confidence=0.85,
                )
        for lesson_title in concept.source_lessons:
            for module in course.modules:
                for lesson in module.lessons:
                    if lesson.title != lesson_title:
                        continue
                    lesson_id = _lesson_node_id(module.title, lesson.title)
                    if concept_node in nodes and lesson_id in nodes:
                        _add_edge(
                            edges,
                            lesson_id,
                            concept_node,
                            "supports_concept",
                            justification=f"Concept '{concept.title}' was extracted from lesson '{lesson.title}'.",
                            provenance=list(lesson.source_refs),
                            # A lesson whose slug equals the concept id is the
                            # concept's primary source; others support it weakly.
                            confidence=0.9 if concept.id == _slugify(lesson.title) else 0.7,
                        )
def write_knowledge_graph(course: NormalizedCourse, concepts: list[ConceptCandidate], outdir: str | Path) -> None:
    """Serialize the course's knowledge graph to ``<outdir>/knowledge_graph.json``.

    Creates *outdir* (and parents) if needed.
    """
    target_dir = Path(outdir)
    target_dir.mkdir(parents=True, exist_ok=True)
    graph = build_knowledge_graph(course, concepts)
    target_path = target_dir / "knowledge_graph.json"
    target_path.write_text(json.dumps(graph, indent=2), encoding="utf-8")

View File

@ -15,6 +15,7 @@ from .mastery_ledger import (
export_capability_profile_json, export_capability_profile_json,
export_capability_report_markdown, export_capability_report_markdown,
) )
from .knowledge_graph import write_knowledge_graph
from .pack_emitter import build_draft_pack, write_draft_pack, write_source_corpus from .pack_emitter import build_draft_pack, write_draft_pack, write_source_corpus
from .rule_policy import RuleContext, build_default_rules, run_rules from .rule_policy import RuleContext, build_default_rules, run_rules
from .topic_ingest import build_topic_bundle, document_to_course, extract_concept_candidates, merge_courses_into_topic_course from .topic_ingest import build_topic_bundle, document_to_course, extract_concept_candidates, merge_courses_into_topic_course
@ -167,6 +168,7 @@ def run_ocw_information_entropy_demo(
) )
write_draft_pack(draft, pack_dir) write_draft_pack(draft, pack_dir)
write_source_corpus(merged, pack_dir) write_source_corpus(merged, pack_dir)
write_knowledge_graph(merged, ctx.concepts, pack_dir)
if source_inventory.exists(): if source_inventory.exists():
inventory = load_sources(source_inventory) inventory = load_sources(source_inventory)
compliance_manifest = build_pack_compliance_manifest(draft.pack["name"], draft.pack["display_name"], inventory) compliance_manifest = build_pack_compliance_manifest(draft.pack["name"], draft.pack["display_name"], inventory)
@ -210,6 +212,7 @@ def run_ocw_information_entropy_demo(
"review_flags": list(ctx.review_flags), "review_flags": list(ctx.review_flags),
"concept_count": len(ctx.concepts), "concept_count": len(ctx.concepts),
"source_fragment_count": len(json.loads((pack_dir / "source_corpus.json").read_text(encoding="utf-8")).get("fragments", [])), "source_fragment_count": len(json.loads((pack_dir / "source_corpus.json").read_text(encoding="utf-8")).get("fragments", [])),
"knowledge_graph_summary": json.loads((pack_dir / "knowledge_graph.json").read_text(encoding="utf-8")).get("summary", {}),
"target_concept": target_key, "target_concept": target_key,
"curriculum_path": concept_path, "curriculum_path": concept_path,
"mastered_concepts": sorted(state.mastered_concepts), "mastered_concepts": sorted(state.mastered_concepts),

View File

@ -5,6 +5,7 @@ from pathlib import Path
import sys import sys
from .config import load_config from .config import load_config
from .graph_retrieval import lesson_titles_for_concept, prerequisite_titles, source_fragments_for_concept
from .model_provider import ModelProvider from .model_provider import ModelProvider
from .ocw_skill_agent_demo import load_ocw_skill_context from .ocw_skill_agent_demo import load_ocw_skill_context
from .role_prompts import evaluator_system_prompt, learner_system_prompt, mentor_system_prompt, practice_system_prompt from .role_prompts import evaluator_system_prompt, learner_system_prompt, mentor_system_prompt, practice_system_prompt
@ -153,6 +154,34 @@ def _path_titles(context, limit: int | None = None) -> list[str]:
return titles[:limit] if limit is not None else titles return titles[:limit] if limit is not None else titles
def _concept_by_title(context, title: str) -> dict | None:
lowered = title.strip().lower()
for concept in context.concepts:
if str(concept.get("title", "")).strip().lower() == lowered:
return concept
return None
def _grounding_text_for_title(context, title: str) -> str:
    """Build a graph-grounded prompt preamble for the concept named *title*.

    Lists prerequisites, supporting lessons, and up to two grounding
    fragments pulled from the graph bundle. Returns "" when the title does
    not match any known concept.
    """
    concept = _concept_by_title(context, title)
    if concept is None:
        return ""
    concept_id = concept.get("id", "")
    bundle = context.graph_bundle
    prereqs = prerequisite_titles(bundle, concept_id)
    lessons = lesson_titles_for_concept(bundle, concept_id)
    fragments = source_fragments_for_concept(bundle, concept_id, limit=2)
    prereq_text = ", ".join(prereqs) if prereqs else "none explicit"
    lesson_text = ", ".join(lessons) if lessons else title
    lines = [
        f"Concept focus: {title}",
        f"Prerequisites: {prereq_text}",
        f"Supporting lessons: {lesson_text}",
    ]
    fragment_texts = [fragment.get("text", "") for fragment in fragments if fragment.get("text")]
    if fragment_texts:
        lines.append("Grounding fragments:")
        for text in fragment_texts:
            lines.append(f"- {text}")
    return "\n".join(lines)
def _healthy_rolemesh_models(provider: ModelProvider) -> set[str]: def _healthy_rolemesh_models(provider: ModelProvider) -> set[str]:
config = provider.config config = provider.config
if config.provider.lower() != "rolemesh": if config.provider.lower() != "rolemesh":
@ -240,6 +269,8 @@ def build_ocw_rolemesh_transcript(config_path: str | Path, skill_dir: str | Path
mentor_guidance = _generate_checked( mentor_guidance = _generate_checked(
provider, provider,
f"{_grounding_text_for_title(context, path_titles[1])}\n\n"
f"{_grounding_text_for_title(context, path_titles[2])}\n\n"
"Given the learner reflection, explain the first two concepts to study from the generated path and why. " "Given the learner reflection, explain the first two concepts to study from the generated path and why. "
f"Path reference: {path_titles[:4]}", f"Path reference: {path_titles[:4]}",
role="mentor", role="mentor",
@ -254,6 +285,8 @@ def build_ocw_rolemesh_transcript(config_path: str | Path, skill_dir: str | Path
practice_task = _generate_checked( practice_task = _generate_checked(
provider, provider,
f"{_grounding_text_for_title(context, path_titles[1])}\n\n"
f"{_grounding_text_for_title(context, path_titles[2])}\n\n"
"Generate one short practice task that forces the learner to connect counting/probability with Shannon entropy, " "Generate one short practice task that forces the learner to connect counting/probability with Shannon entropy, "
"without giving away the full answer.", "without giving away the full answer.",
role="practice", role="practice",
@ -282,6 +315,7 @@ def build_ocw_rolemesh_transcript(config_path: str | Path, skill_dir: str | Path
evaluator_feedback = _generate_checked( evaluator_feedback = _generate_checked(
provider, provider,
f"{_grounding_text_for_title(context, path_titles[2])}\n\n"
"Evaluate this learner attempt for correctness, explanation quality, and limitations. " "Evaluate this learner attempt for correctness, explanation quality, and limitations. "
f"Task: {practice_task}\nAttempt: {learner_attempt}", f"Task: {practice_task}\nAttempt: {learner_attempt}",
role="evaluator", role="evaluator",
@ -296,6 +330,7 @@ def build_ocw_rolemesh_transcript(config_path: str | Path, skill_dir: str | Path
mentor_next_step = _generate_checked( mentor_next_step = _generate_checked(
provider, provider,
f"{_grounding_text_for_title(context, 'Channel Capacity')}\n\n"
"Given the evaluator feedback, tell the learner what to do next before moving on to channel capacity. " "Given the evaluator feedback, tell the learner what to do next before moving on to channel capacity. "
"Use the course path to show what comes next.", "Use the course path to show what comes next.",
role="mentor", role="mentor",
@ -313,18 +348,21 @@ def build_ocw_rolemesh_transcript(config_path: str | Path, skill_dir: str | Path
"topic": "Channel Capacity", "topic": "Channel Capacity",
"path_slice": path_titles[4:7] or path_titles, "path_slice": path_titles[4:7] or path_titles,
"practice_anchor": "binary symmetric channel", "practice_anchor": "binary symmetric channel",
"grounding_title": "Channel Capacity",
"required_terms": ["channel", "capacity", "entropy", "noise"], "required_terms": ["channel", "capacity", "entropy", "noise"],
}, },
{ {
"topic": "Coding and Compression", "topic": "Coding and Compression",
"path_slice": path_titles[5:9] or path_titles, "path_slice": path_titles[5:9] or path_titles,
"practice_anchor": "compression and error-correcting code", "practice_anchor": "compression and error-correcting code",
"grounding_title": "Source Coding and Compression",
"required_terms": ["coding", "compression", "redundancy", "error"], "required_terms": ["coding", "compression", "redundancy", "error"],
}, },
{ {
"topic": "Thermodynamic Entropy and Synthesis", "topic": "Thermodynamic Entropy and Synthesis",
"path_slice": path_titles[8:] or path_titles, "path_slice": path_titles[8:] or path_titles,
"practice_anchor": "thermodynamic entropy", "practice_anchor": "thermodynamic entropy",
"grounding_title": "Thermodynamics and Entropy",
"required_terms": ["thermodynamic", "entropy", "information", "physical"], "required_terms": ["thermodynamic", "entropy", "information", "physical"],
}, },
] ]
@ -332,6 +370,7 @@ def build_ocw_rolemesh_transcript(config_path: str | Path, skill_dir: str | Path
for stage in stage_specs: for stage in stage_specs:
mentor_stage = _generate_checked( mentor_stage = _generate_checked(
provider, provider,
f"{_grounding_text_for_title(context, stage['grounding_title'])}\n\n"
f"The learner is continuing through the MIT OCW Information and Entropy course. " f"The learner is continuing through the MIT OCW Information and Entropy course. "
f"Bridge from the previous work into {stage['topic']}. " f"Bridge from the previous work into {stage['topic']}. "
f"Reference this path segment: {stage['path_slice']}. " f"Reference this path segment: {stage['path_slice']}. "
@ -362,6 +401,7 @@ def build_ocw_rolemesh_transcript(config_path: str | Path, skill_dir: str | Path
practice_stage = _generate_checked( practice_stage = _generate_checked(
provider, provider,
f"{_grounding_text_for_title(context, stage['grounding_title'])}\n\n"
f"Create one short reasoning task about {stage['practice_anchor']} for the learner. " f"Create one short reasoning task about {stage['practice_anchor']} for the learner. "
"Keep it course-relevant and do not provide the full solution.", "Keep it course-relevant and do not provide the full solution.",
role="practice", role="practice",
@ -376,6 +416,7 @@ def build_ocw_rolemesh_transcript(config_path: str | Path, skill_dir: str | Path
evaluator_stage = _generate_checked( evaluator_stage = _generate_checked(
provider, provider,
f"{_grounding_text_for_title(context, stage['grounding_title'])}\n\n"
f"Give short evaluator feedback on this learner reflection in the context of {stage['topic']}: " f"Give short evaluator feedback on this learner reflection in the context of {stage['topic']}: "
f"{learner_stage}\nTask context: {practice_stage}", f"{learner_stage}\nTask context: {practice_stage}",
role="evaluator", role="evaluator",
@ -393,6 +434,7 @@ def build_ocw_rolemesh_transcript(config_path: str | Path, skill_dir: str | Path
"skill": context.skill_name, "skill": context.skill_name,
"course": context.pack.get("display_name", context.pack.get("name", "")), "course": context.pack.get("display_name", context.pack.get("name", "")),
"curriculum_path_titles": path_titles, "curriculum_path_titles": path_titles,
"graph_grounding_summary": context.run_summary.get("knowledge_graph_summary", {}),
"role_fallbacks": role_fallbacks, "role_fallbacks": role_fallbacks,
"status_updates": status_updates, "status_updates": status_updates,
"transcript": turns, "transcript": turns,

View File

@ -7,6 +7,7 @@ from pathlib import Path
import yaml import yaml
from .evaluator_pipeline import CritiqueEvaluator, LearnerAttempt, RubricEvaluator, SymbolicRuleEvaluator, aggregate, run_pipeline from .evaluator_pipeline import CritiqueEvaluator, LearnerAttempt, RubricEvaluator, SymbolicRuleEvaluator, aggregate, run_pipeline
from .graph_retrieval import GraphBundle, lesson_titles_for_concept, prerequisite_titles, source_fragments_for_concept
@dataclass @dataclass
@ -17,6 +18,7 @@ class SkillContext:
capability_summary: str capability_summary: str
pack: dict pack: dict
concepts: list[dict] concepts: list[dict]
graph_bundle: GraphBundle
capability_profile: dict capability_profile: dict
run_summary: dict run_summary: dict
@ -46,6 +48,10 @@ def load_ocw_skill_context(skill_dir: str | Path) -> SkillContext:
capability_summary=(skill_dir / "references" / "generated-capability-summary.md").read_text(encoding="utf-8"), capability_summary=(skill_dir / "references" / "generated-capability-summary.md").read_text(encoding="utf-8"),
pack=yaml.safe_load((pack_dir / "pack.yaml").read_text(encoding="utf-8")) or {}, pack=yaml.safe_load((pack_dir / "pack.yaml").read_text(encoding="utf-8")) or {},
concepts=(yaml.safe_load((pack_dir / "concepts.yaml").read_text(encoding="utf-8")) or {}).get("concepts", []), concepts=(yaml.safe_load((pack_dir / "concepts.yaml").read_text(encoding="utf-8")) or {}).get("concepts", []),
graph_bundle=GraphBundle(
knowledge_graph=json.loads((pack_dir / "knowledge_graph.json").read_text(encoding="utf-8")),
source_corpus=json.loads((pack_dir / "source_corpus.json").read_text(encoding="utf-8")),
),
capability_profile=json.loads((run_dir / "capability_profile.json").read_text(encoding="utf-8")), capability_profile=json.loads((run_dir / "capability_profile.json").read_text(encoding="utf-8")),
run_summary=json.loads((run_dir / "run_summary.json").read_text(encoding="utf-8")), run_summary=json.loads((run_dir / "run_summary.json").read_text(encoding="utf-8")),
) )
@ -88,8 +94,16 @@ def build_skill_grounded_study_plan(context: SkillContext, target_task: str) ->
"concept_key": concept_key, "concept_key": concept_key,
"title": concept["title"], "title": concept["title"],
"status": "mastered" if concept_key in context.capability_profile.get("mastered_concepts", []) else "review-needed", "status": "mastered" if concept_key in context.capability_profile.get("mastered_concepts", []) else "review-needed",
"prerequisites": [ "prerequisites": [_concept_key(pack_name, prereq) for prereq in concept.get("prerequisites", [])],
_concept_key(pack_name, prereq) for prereq in concept.get("prerequisites", []) "prerequisite_titles": prerequisite_titles(context.graph_bundle, concept_id),
"supporting_lessons": lesson_titles_for_concept(context.graph_bundle, concept_id),
"source_fragments": [
{
"lesson_title": fragment.get("lesson_title", ""),
"kind": fragment.get("kind", ""),
"text": fragment.get("text", ""),
}
for fragment in source_fragments_for_concept(context.graph_bundle, concept_id, limit=2)
], ],
"recommended_action": ( "recommended_action": (
f"Use {concept['title']} as the primary teaching anchor." f"Use {concept['title']} as the primary teaching anchor."
@ -115,10 +129,14 @@ def build_skill_grounded_explanation(context: SkillContext, concept_id: str) ->
concept_key = _concept_key(pack_name, concept_id) concept_key = _concept_key(pack_name, concept_id)
summary = context.capability_profile.get("evaluator_summary_by_concept", {}).get(concept_key, {}) summary = context.capability_profile.get("evaluator_summary_by_concept", {}).get(concept_key, {})
prereqs = prerequisite_titles(context.graph_bundle, concept_id)
lessons = lesson_titles_for_concept(context.graph_bundle, concept_id)
fragments = source_fragments_for_concept(context.graph_bundle, concept_id, limit=2)
explanation = ( explanation = (
f"{concept['title']} is represented in the Information and Entropy skill as part of a progression from " f"{concept['title']} is represented in the Information and Entropy skill as part of a progression from "
f"foundational probability ideas toward communication limits and physical interpretation. " f"foundational probability ideas toward communication limits and physical interpretation. "
f"It depends on {', '.join(concept.get('prerequisites', []) or ['no explicit prerequisites in the generated pack'])}. " f"It depends on {', '.join(prereqs or concept.get('prerequisites', []) or ['no explicit prerequisites in the generated pack'])}. "
f"It is grounded by lessons such as {', '.join(lessons or [concept['title']])}. "
f"The current demo learner already mastered this concept, with evaluator means {summary}, so the skill can use it as a stable explanation anchor." f"The current demo learner already mastered this concept, with evaluator means {summary}, so the skill can use it as a stable explanation anchor."
) )
return { return {
@ -126,6 +144,17 @@ def build_skill_grounded_explanation(context: SkillContext, concept_id: str) ->
"title": concept["title"], "title": concept["title"],
"explanation": explanation, "explanation": explanation,
"source_description": concept.get("description", ""), "source_description": concept.get("description", ""),
"grounding": {
"supporting_lessons": lessons,
"source_fragments": [
{
"lesson_title": fragment.get("lesson_title", ""),
"kind": fragment.get("kind", ""),
"text": fragment.get("text", ""),
}
for fragment in fragments
],
},
} }
@ -154,6 +183,7 @@ def evaluate_submission_with_skill(context: SkillContext, concept_id: str, submi
"skill_reference": { "skill_reference": {
"skill_name": context.skill_name, "skill_name": context.skill_name,
"mastered_by_demo_agent": mastered_reference, "mastered_by_demo_agent": mastered_reference,
"supporting_lessons": lesson_titles_for_concept(context.graph_bundle, concept_id),
}, },
"follow_up": ( "follow_up": (
"Extend the answer with an explicit limitation or assumption." "Extend the answer with an explicit limitation or assumption."
@ -205,6 +235,7 @@ def run_ocw_skill_agent_demo(skill_dir: str | Path, out_dir: str | Path) -> dict
"", "",
"## Explanation Demo", "## Explanation Demo",
explanation["explanation"], explanation["explanation"],
f"- Supporting lessons: {explanation['grounding']['supporting_lessons']}",
"", "",
"## Evaluation Demo", "## Evaluation Demo",
f"- Verdict: {evaluation['verdict']}", f"- Verdict: {evaluation['verdict']}",

View File

@ -87,7 +87,7 @@ def build_draft_pack(
"overrides": [], "overrides": [],
"profile_templates": {}, "profile_templates": {},
"cross_pack_links": [], "cross_pack_links": [],
"supporting_artifacts": ["source_corpus.json"], "supporting_artifacts": ["source_corpus.json", "knowledge_graph.json"],
} }
concepts_yaml = { concepts_yaml = {
"concepts": [ "concepts": [

View File

@ -0,0 +1,44 @@
from pathlib import Path
import json
from didactopus.course_ingest import parse_markdown_course, extract_concept_candidates
from didactopus.knowledge_graph import build_knowledge_graph, write_knowledge_graph
from didactopus.rule_policy import RuleContext, build_default_rules, run_rules
# Minimal markdown course fixture: one module with two lessons, one
# objective each and a single exercise, enough to exercise every node type.
SAMPLE = """
# Sample Course
## Module 1
### Lesson A
- Objective: Explain Topic A.
- Exercise: Do task A.
Topic A body.
### Lesson B
- Objective: Explain Topic B.
Lesson B body.
"""
def test_build_knowledge_graph_contains_typed_nodes_and_edges(tmp_path: Path) -> None:
    """The builder emits typed nodes/edges and the writer round-trips them."""
    course = parse_markdown_course(SAMPLE, "Sample Course")
    candidates = extract_concept_candidates(course)
    ctx = RuleContext(course=course, concepts=candidates)
    run_rules(ctx, build_default_rules())

    graph = build_knowledge_graph(course, ctx.concepts)
    observed_node_types = {node["type"] for node in graph["nodes"]}
    observed_edge_types = {edge["type"] for edge in graph["edges"]}

    assert graph["summary"]["concept_count"] >= 2
    for expected_type in ("source", "lesson", "concept", "assessment_signal"):
        assert expected_type in observed_node_types
    assert "contains_lesson" in observed_edge_types
    assert observed_edge_types & {"teaches_concept", "supports_concept"}

    write_knowledge_graph(course, ctx.concepts, tmp_path)
    round_tripped = json.loads((tmp_path / "knowledge_graph.json").read_text(encoding="utf-8"))
    assert round_tripped["summary"]["node_count"] >= len(graph["nodes"])

View File

@ -28,11 +28,13 @@ def test_ocw_rolemesh_transcript_demo_writes_artifacts(tmp_path: Path) -> None:
assert payload["provider"] == "stub" assert payload["provider"] == "stub"
assert len(payload["transcript"]) >= 16 assert len(payload["transcript"]) >= 16
assert len(payload["curriculum_path_titles"]) >= 8 assert len(payload["curriculum_path_titles"]) >= 8
assert payload["graph_grounding_summary"]["node_count"] >= 1
assert payload["role_fallbacks"] == {} assert payload["role_fallbacks"] == {}
assert payload["status_updates"] == [] assert payload["status_updates"] == []
assert any(turn["speaker"] == "Didactopus Evaluator" for turn in payload["transcript"]) assert any(turn["speaker"] == "Didactopus Evaluator" for turn in payload["transcript"])
assert any("channel" in turn["content"].lower() for turn in payload["transcript"]) assert any("channel" in turn["content"].lower() for turn in payload["transcript"])
assert any("thermodynamic" in turn["content"].lower() for turn in payload["transcript"]) assert any("thermodynamic" in turn["content"].lower() for turn in payload["transcript"])
assert any("supporting lessons" in turn["content"].lower() or "grounding fragments" in turn["content"].lower() for turn in payload["transcript"])
assert all(not _looks_truncated(turn["content"]) for turn in payload["transcript"]) assert all(not _looks_truncated(turn["content"]) for turn in payload["transcript"])
assert (tmp_path / "rolemesh_transcript.json").exists() assert (tmp_path / "rolemesh_transcript.json").exists()
assert (tmp_path / "rolemesh_transcript.md").exists() assert (tmp_path / "rolemesh_transcript.md").exists()

View File

@ -17,6 +17,9 @@ def test_run_ocw_skill_agent_demo(tmp_path: Path) -> None:
assert (tmp_path / "skill_demo.json").exists() assert (tmp_path / "skill_demo.json").exists()
assert (tmp_path / "skill_demo.md").exists() assert (tmp_path / "skill_demo.md").exists()
assert payload["study_plan"]["steps"] assert payload["study_plan"]["steps"]
assert payload["study_plan"]["steps"][0]["supporting_lessons"]
assert "grounding" in payload["explanation"]
assert payload["explanation"]["grounding"]["supporting_lessons"]
assert payload["evaluation"]["verdict"] in {"acceptable", "needs_revision"} assert payload["evaluation"]["verdict"] in {"acceptable", "needs_revision"}
@ -30,4 +33,5 @@ def test_skill_demo_flags_weak_submission() -> None:
) )
assert result["verdict"] == "needs_revision" assert result["verdict"] == "needs_revision"
assert result["skill_reference"]["supporting_lessons"]
assert "Rework the answer" in result["follow_up"] assert "Rework the answer" in result["follow_up"]

View File

@ -1,7 +1,8 @@
from pathlib import Path from pathlib import Path
from didactopus.course_ingest import parse_markdown_course, extract_concept_candidates from didactopus.course_ingest import parse_markdown_course, extract_concept_candidates
from didactopus.knowledge_graph import write_knowledge_graph
from didactopus.rule_policy import RuleContext, build_default_rules, run_rules from didactopus.rule_policy import RuleContext, build_default_rules, run_rules
from didactopus.pack_emitter import build_draft_pack, write_draft_pack from didactopus.pack_emitter import build_draft_pack, write_draft_pack, write_source_corpus
SAMPLE = ''' SAMPLE = '''
# Sample Course # Sample Course
@ -20,5 +21,9 @@ def test_emit_pack(tmp_path: Path) -> None:
run_rules(ctx, build_default_rules()) run_rules(ctx, build_default_rules())
draft = build_draft_pack(course, ctx.concepts, "Tester", "REVIEW", ctx.review_flags) draft = build_draft_pack(course, ctx.concepts, "Tester", "REVIEW", ctx.review_flags)
write_draft_pack(draft, tmp_path) write_draft_pack(draft, tmp_path)
write_source_corpus(course, tmp_path)
write_knowledge_graph(course, ctx.concepts, tmp_path)
assert (tmp_path / "pack.yaml").exists() assert (tmp_path / "pack.yaml").exists()
assert (tmp_path / "review_report.md").exists() assert (tmp_path / "review_report.md").exists()
assert (tmp_path / "source_corpus.json").exists()
assert (tmp_path / "knowledge_graph.json").exists()