diff --git a/crates/plotnik-lib/src/bytecode/dump.rs b/crates/plotnik-lib/src/bytecode/dump.rs
new file mode 100644
index 00000000..01fec032
--- /dev/null
+++ b/crates/plotnik-lib/src/bytecode/dump.rs
@@ -0,0 +1,560 @@
+//! Human-readable bytecode dump for debugging and documentation.
+//!
+//! See `docs/wip/bytecode.md` for the output format specification.
+
+use std::collections::BTreeMap;
+use std::fmt::Write as _;
+
+use super::effects::EffectOpcode;
+use super::ids::{QTypeId, StepId, StringId};
+use super::module::{Instruction, Module};
+use super::nav::Nav;
+use super::type_meta::TypeKind;
+use super::{Call, Match, Return};
+
+/// Render `module` as text: header, strings, type tables, entrypoints, then code.
+pub fn dump(module: &Module) -> String {
+    // Lookup tables are built once and shared by every section writer.
+    let context = DumpContext::new(module);
+    let mut text = String::new();
+    dump_header(&mut text, module);
+    dump_strings(&mut text, module);
+    dump_types_defs(&mut text, module, &context);
+    dump_types_members(&mut text, module, &context);
+    dump_types_names(&mut text, module, &context);
+    dump_entrypoints(&mut text, module, &context);
+    dump_code(&mut text, module, &context);
+
+    text
+}
+
+/// Write the `[header]` section: the linked flag followed by a blank line.
+fn dump_header(out: &mut String, module: &Module) {
+    let linked = module.header().is_linked();
+    // Writing into a `String` cannot fail, so the unwrap is safe.
+    write!(out, "[header]\nlinked = {linked}\n\n").unwrap();
+}
+
+/// Precomputed lookup tables shared by the dump section writers.
+struct DumpContext {
+    /// Copy of the header's linked flag; selects how node type/field IDs are named.
+    is_linked: bool,
+    /// Entrypoint target step (raw `StepId` value) -> entrypoint name, used for labels.
+    step_labels: BTreeMap<u16, String>,
+    /// Node type ID -> name, built from `module.node_types()` (consulted in linked mode).
+    node_type_names: BTreeMap<u16, String>,
+    /// Node field ID -> name, built from `module.node_fields()` (consulted in linked mode).
+    node_field_names: BTreeMap<u16, String>,
+    /// Entrypoint names in table order (looked up by index for Return formatting).
+    entrypoint_names: Vec<String>,
+    /// Every string table entry by index; unlinked IDs are resolved against it.
+    all_strings: Vec<String>,
+}
+
+impl DumpContext {
+    /// Build every lookup table from `module`.
+    fn new(module: &Module) -> Self {
+        let header = module.header();
+        let strings = module.strings();
+        let entrypoints = module.entrypoints();
+        let node_types = module.node_types();
+        let node_fields = module.node_fields();
+
+        // Entrypoints feed two tables: target step -> label and index -> name.
+        let mut step_labels = BTreeMap::new();
+        let mut entrypoint_names = Vec::with_capacity(entrypoints.len());
+        for index in 0..entrypoints.len() {
+            let entry = entrypoints.get(index);
+            let label = strings.get(entry.name).to_string();
+            entrypoint_names.push(label.clone());
+            step_labels.insert(entry.target.0, label);
+        }
+
+        // Node type and field tables, keyed by their numeric ID.
+        let node_type_names: BTreeMap<u16, String> = (0..node_types.len())
+            .map(|index| {
+                let symbol = node_types.get(index);
+                (symbol.id, strings.get(symbol.name).to_string())
+            })
+            .collect();
+        let node_field_names: BTreeMap<u16, String> = (0..node_fields.len())
+            .map(|index| {
+                let symbol = node_fields.get(index);
+                (symbol.id, strings.get(symbol.name).to_string())
+            })
+            .collect();
+
+        // Snapshot of the whole string table, indexed by raw `StringId` value.
+        let all_strings = (0..header.str_table_count as usize)
+            .map(|raw| strings.get(StringId(raw as u16)).to_string())
+            .collect();
+
+        Self {
+            is_linked: header.is_linked(),
+            step_labels,
+            node_type_names,
+            node_field_names,
+            entrypoint_names,
+            all_strings,
+        }
+    }
+
+    /// Entrypoint name whose target is `step`, if any.
+    fn label_for(&self, step: StepId) -> Option<&str> {
+        self.step_labels.get(&step.0).map(String::as_str)
+    }
+
+    /// Resolve a node type ID to its name: via the node type table when linked,
+    /// otherwise by treating `id` as an index into the string table.
+    fn node_type_name(&self, id: u16) -> Option<&str> {
+        let hit = if self.is_linked {
+            self.node_type_names.get(&id)
+        } else {
+            self.all_strings.get(usize::from(id))
+        };
+        hit.map(String::as_str)
+    }
+
+    /// Resolve a node field ID to its name: via the node field table when linked,
+    /// otherwise by treating `id` as an index into the string table.
+    fn node_field_name(&self, id: u16) -> Option<&str> {
+        let hit = if self.is_linked {
+            self.node_field_names.get(&id)
+        } else {
+            self.all_strings.get(usize::from(id))
+        };
+        hit.map(String::as_str)
+    }
+
+    /// Name of the entrypoint at `index` in table order, if in range.
+    fn entrypoint_name(&self, index: usize) -> Option<&str> {
+        self.entrypoint_names.get(index).map(String::as_str)
+    }
+}
+
+/// Write the `[strings]` section: one `S## <debug-formatted string>` line per entry.
+fn dump_strings(out: &mut String, module: &Module) {
+    let table = module.strings();
+    let total = module.header().str_table_count as usize;
+    out.push_str("[strings]\n");
+    for index in 0..total {
+        let value = table.get(StringId(index as u16));
+        writeln!(out, "S{index:02} {value:?}").unwrap();
+    }
+    out.push('\n');
+}
+
+/// Write the `[types.defs]` section.
+///
+/// The three builtin types are emitted first as `T00`-`T02`; every custom
+/// definition follows, numbered from `T03`, with a `;` comment that spells
+/// out its members or wrapped type (aliases get no comment).
+///
+/// Panics if a definition reports an invalid type kind.
+fn dump_types_defs(out: &mut String, module: &Module, ctx: &DumpContext) {
+    let types = module.types();
+    let strings = module.strings();
+
+    out.push_str("[types.defs]\n");
+
+    // Builtins (T00-T02) are fixed; the definitions table holds T03 and up.
+    out.push_str("T00 = void\nT01 = Node\nT02 = str\n");
+
+    for index in 0..types.defs_count() {
+        let def = types.get_def(index);
+        let kind = def.type_kind().expect("valid type kind");
+
+        // Names of the members a composite definition points at.
+        let member_names = || -> Vec<String> {
+            types
+                .members_of(&def)
+                .map(|member| strings.get(member.name).to_string())
+                .collect()
+        };
+        // Display name of the type wrapped by Optional / Array definitions.
+        let inner = || format_type_name(QTypeId(def.data), module, ctx);
+
+        // Left: the raw encoding. Right: the human-readable `;` comment.
+        let (formatted, comment) = match kind {
+            TypeKind::Struct => (
+                format!("Struct(M{}, {})", def.data, def.count),
+                format!("  ; {{ {} }}", member_names().join(", ")),
+            ),
+            TypeKind::Enum => (
+                format!("Enum(M{}, {})", def.data, def.count),
+                format!("  ; {}", member_names().join(" | ")),
+            ),
+            TypeKind::Optional => (
+                format!("Optional(T{:02})", def.data),
+                format!("  ; {}?", inner()),
+            ),
+            TypeKind::ArrayZeroOrMore => (
+                format!("ArrayStar(T{:02})", def.data),
+                format!("  ; {}*", inner()),
+            ),
+            TypeKind::ArrayOneOrMore => (
+                format!("ArrayPlus(T{:02})", def.data),
+                format!("  ; {}+", inner()),
+            ),
+            TypeKind::Alias => (format!("Alias(T{:02})", def.data), String::new()),
+        };
+
+        // Custom type IDs start right after the three builtins.
+        let type_id = index + 3;
+        writeln!(out, "T{type_id:02} = {formatted}{comment}").unwrap();
+    }
+    out.push('\n');
+}
+
+/// Write the `[types.members]` section: one `M<i>` line per member, giving
+/// its name string ID and type ID plus a `; name: type` comment.
+fn dump_types_members(out: &mut String, module: &Module, ctx: &DumpContext) {
+    let types = module.types();
+    let strings = module.strings();
+    out.push_str("[types.members]\n");
+
+    for index in 0..types.members_count() {
+        let member = types.get_member(index);
+        let (name_id, type_id) = (member.name.0, member.type_id.0);
+        let label = strings.get(member.name);
+        let resolved = format_type_name(member.type_id, module, ctx);
+        let line = format!("M{index} = (S{name_id:02}, T{type_id:02})  ; {label}: {resolved}");
+        out.push_str(&line);
+        out.push('\n');
+    }
+    out.push('\n');
+}
+
+/// Write the `[types.names]` section: one `N<i>` line per named type, giving
+/// its name string ID and type ID plus the name itself as a `;` comment.
+fn dump_types_names(out: &mut String, module: &Module, _ctx: &DumpContext) {
+    let types = module.types();
+    let strings = module.strings();
+    out.push_str("[types.names]\n");
+
+    for index in 0..types.names_count() {
+        let entry = types.get_name(index);
+        let (name_id, type_id) = (entry.name.0, entry.type_id.0);
+        let label = strings.get(entry.name);
+        let line = format!("N{index} = (S{name_id:02}, T{type_id:02})  ; {label}");
+        out.push_str(&line);
+        out.push('\n');
+    }
+    out.push('\n');
+}
+
+/// Produce a display name for `type_id`.
+///
+/// Builtins map to `void` / `Node` / `str`. Other types use the first matching
+/// entry in the module's type-name table, or `T##` when no entry names them.
+fn format_type_name(type_id: QTypeId, module: &Module, _ctx: &DumpContext) -> String {
+    if type_id.is_builtin() {
+        let builtin = match type_id.0 {
+            0 => "void",
+            1 => "Node",
+            2 => "str",
+            _ => unreachable!(),
+        };
+        return builtin.to_string();
+    }
+
+    let types = module.types();
+    let named = (0..types.names_count())
+        .map(|index| types.get_name(index))
+        .find(|entry| entry.type_id == type_id);
+
+    match named {
+        Some(entry) => module.strings().get(entry.name).to_string(),
+        None => format!("T{:02}", type_id.0),
+    }
+}
+
+/// Write the `[entry]` section: one `name = step :: T##` line per entrypoint,
+/// sorted by name, with names padded to a common width.
+fn dump_entrypoints(out: &mut String, module: &Module, _ctx: &DumpContext) {
+    let strings = module.strings();
+    let entrypoints = module.entrypoints();
+    out.push_str("[entry]\n");
+
+    // Collect and sort by name for display
+    let mut entries: Vec<_> = (0..entrypoints.len())
+        .map(|i| {
+            let ep = entrypoints.get(i);
+            let name = strings.get(ep.name);
+            (name, ep.target.0, ep.result_type.0)
+        })
+        .collect();
+    entries.sort_by_key(|(name, _, _)| *name);
+
+    // `{:width$}` pads by character count, so measure names in characters
+    // (not bytes); otherwise non-ASCII names would widen the column needlessly.
+    let max_len = entries
+        .iter()
+        .map(|(name, _, _)| name.chars().count())
+        .max()
+        .unwrap_or(0);
+
+    for (name, target, type_id) in entries {
+        writeln!(out, "{name:max_len$} = {target:02} :: T{type_id:02}").unwrap();
+    }
+    out.push('\n');
+}
+
+/// Write the `[code]` section: one line per instruction, in step order.
+///
+/// Steps that are entrypoint targets are preceded by a blank line and a
+/// `name:` label. Multi-step instructions advance the cursor by their size.
+fn dump_code(out: &mut String, module: &Module, ctx: &DumpContext) {
+    let transitions_count = module.header().transitions_count as usize;
+
+    // Step numbers are zero-padded to the digit count of the total, minimum 2.
+    let step_width = transitions_count.to_string().len().max(2);
+
+    out.push_str("[code]\n");
+
+    // The cursor is a `usize`: with a `u16` cursor, `step += size` near
+    // `u16::MAX` would overflow (panic in debug builds, wrap and loop in release).
+    let mut cursor = 0usize;
+    while cursor < transitions_count {
+        // Lossless: `cursor < transitions_count`, which itself came from a `u16`.
+        let step = cursor as u16;
+        if let Some(label) = ctx.label_for(StepId(step)) {
+            writeln!(out, "\n{label}:").unwrap();
+        }
+
+        let instr = module.decode_step(StepId(step));
+        out.push_str(&format_instruction(step, &instr, module, ctx, step_width));
+        out.push('\n');
+
+        // Advance past every step this instruction occupies.
+        cursor += usize::from(instruction_step_count(&instr));
+    }
+}
+
+/// Right-pad `base` with spaces up to `col` characters, then append `suffix`.
+fn pad_to_column(base: String, col: usize, suffix: &str) -> String {
+    let width = base.chars().count();
+    base + &" ".repeat(col.saturating_sub(width)) + suffix
+}
+
+/// Number of steps an instruction spans.
+///
+/// Calls, returns and plain matches (no effects, no negated fields, at most
+/// one successor) take one step. Other matches are sized by their total
+/// payload slot count: up to 4, 8, 12 or 20 slots take 2, 3, 4 or 6 steps,
+/// and anything larger takes 8.
+fn instruction_step_count(instr: &Instruction) -> u16 {
+    let m = match instr {
+        Instruction::Match(m) => m,
+        Instruction::Call(_) | Instruction::Return(_) => return 1,
+    };
+
+    // Payload slots other than successors.
+    let extras = m.pre_effects.len() + m.neg_fields.len() + m.post_effects.len();
+    let successors = m.successors.len();
+
+    // The compact form carries no payload beyond an optional single successor.
+    if extras == 0 && successors <= 1 {
+        return 1; // Match8
+    }
+
+    match extras + successors {
+        0..=4 => 2, // Match16
+        5..=8 => 3, // Match24
+        9..=12 => 4, // Match32
+        13..=20 => 6, // Match48
+        _ => 8, // Match64
+    }
+}
+
+fn format_instruction(
+    step: u16, // step ID of this instruction, printed at the start of the line
+    instr: &Instruction,
+    module: &Module,
+    ctx: &DumpContext,
+    step_width: usize, // zero-pad width for step numbers
+) -> String {
+    match instr { // dispatch on the instruction kind; each formatter returns one line
+        Instruction::Match(m) => format_match(step, m, module, ctx, step_width),
+        Instruction::Call(c) => format_call(step, c, module, ctx, step_width),
+        Instruction::Return(r) => format_return(step, r, module, ctx, step_width),
+    }
+}
+
+/// Render a match instruction as one dump line.
+///
+/// Layout: two-space indent and zero-padded step number, the navigation
+/// column, the space-separated content (pre-effects, negated fields,
+/// field/type constraint, post-effects), then the successors padded out to
+/// column 44. An empty successor list is shown as `◼`. IDs without a known
+/// name are printed as `field#N` / `node#N`.
+///
+/// `_module` is unused here.
+fn format_match(
+    step: u16,
+    m: &Match,
+    _module: &Module,
+    ctx: &DumpContext,
+    step_width: usize,
+) -> String {
+    // Nav column: `𝜀` is centered for Stay; other symbols follow a 2-space
+    // indent and are padded towards 7 characters, keeping at least one space.
+    let nav_col = match m.nav {
+        Nav::Stay => "   𝜀   ".to_string(),
+        nav => {
+            let symbol = format_nav(nav);
+            let trailing = 7usize.saturating_sub(2 + symbol.chars().count()).max(1);
+            format!("  {symbol}{}", " ".repeat(trailing))
+        }
+    };
+
+    let mut parts: Vec<String> = Vec::new();
+
+    // Pre-effects, bracketed.
+    if !m.pre_effects.is_empty() {
+        let rendered: Vec<String> = m.pre_effects.iter().map(format_effect).collect();
+        parts.push(format!("[{}]", rendered.join(" ")));
+    }
+
+    // Negated fields, each prefixed with `!`; unknown IDs fall back to `field#N`.
+    for &field_id in &m.neg_fields {
+        let negated = match ctx.node_field_name(field_id) {
+            Some(known) => format!("!{known}"),
+            None => format!("!field#{field_id}"),
+        };
+        parts.push(negated);
+    }
+
+    // Field constraint and node type, resolved to names where possible.
+    let field_label = m.node_field.map(|id| match ctx.node_field_name(id.get()) {
+        Some(known) => known.to_string(),
+        None => format!("field#{}", id.get()),
+    });
+    let type_label = m.node_type.map(|id| match ctx.node_type_name(id.get()) {
+        Some(known) => known.to_string(),
+        None => format!("node#{}", id.get()),
+    });
+
+    // A field with no type constraint is written with `_` in the type position.
+    let node_part = match (field_label, type_label) {
+        (Some(field), Some(kind)) => format!("{field}: ({kind})"),
+        (Some(field), None) => format!("{field}: _"),
+        (None, Some(kind)) => format!("({kind})"),
+        (None, None) => String::new(),
+    };
+    if !node_part.is_empty() {
+        parts.push(node_part);
+    }
+
+    // Post-effects, bracketed.
+    if !m.post_effects.is_empty() {
+        let rendered: Vec<String> = m.post_effects.iter().map(format_effect).collect();
+        parts.push(format!("[{}]", rendered.join(" ")));
+    }
+
+    // Successors: `◼` when there are none, otherwise a comma-separated list.
+    let succ_str = if m.successors.is_empty() {
+        "◼".to_string()
+    } else {
+        let targets: Vec<String> = m
+            .successors
+            .iter()
+            .map(|&target| format_step(target, ctx, step_width))
+            .collect();
+        targets.join(", ")
+    };
+
+    // Empty content simply contributes nothing between nav column and padding.
+    let content = parts.join(" ");
+    let base = format!("  {step:0step_width$}{nav_col}{content}");
+    pad_to_column(base, 44, &succ_str)
+}
+
+/// Render a call line: `step ▶ (callee)`, then the return step padded to column 44.
+fn format_call(
+    step: u16,
+    c: &Call,
+    _module: &Module,
+    ctx: &DumpContext,
+    step_width: usize,
+) -> String {
+    let callee = match ctx.label_for(c.target) {
+        Some(label) => label.to_string(),
+        None => format!("@{:0step_width$}", c.target.0), // unlabeled: raw padded step
+    };
+    let base = format!("  {step:0step_width$}   ▶   ({callee})");
+    pad_to_column(base, 44, &format_step(c.next, ctx, step_width))
+}
+
+/// Render a return line: `step (name)`, then `▶` padded to column 44.
+fn format_return(
+    step: u16,
+    r: &Return,
+    _module: &Module,
+    ctx: &DumpContext,
+    step_width: usize,
+) -> String {
+    let name = match ctx.entrypoint_name(r.ref_id as usize) {
+        Some(known) => known.to_string(),
+        None => format!("ref#{}", r.ref_id), // no entrypoint at that index
+    };
+    let base = format!("  {step:0step_width$}      ({name})");
+    pad_to_column(base, 44, "▶")
+}
+
+/// Render a step reference: `◼` for the accept sentinel, `▶(name)` for an
+/// entrypoint target, otherwise the zero-padded step number.
+fn format_step(step: StepId, ctx: &DumpContext, step_width: usize) -> String {
+    if step == StepId::ACCEPT {
+        return "◼".to_string();
+    }
+    match ctx.label_for(step) {
+        Some(name) => format!("▶({name})"),
+        None => format!("{:0step_width$}", step.0),
+    }
+}
+
+/// Symbol for a non-Stay navigation; panics on `Nav::Stay` (handled by `format_match`).
+fn format_nav(nav: Nav) -> String {
+    match nav {
+        Nav::Stay => unreachable!("Stay is handled specially in format_match"),
+        Nav::Down => String::from("*↓"),
+        Nav::DownSkip => String::from("~↓"),
+        Nav::DownExact => String::from(".↓"),
+        Nav::Next => String::from("* "),
+        Nav::NextSkip => String::from("~ "),
+        Nav::NextExact => String::from(". "),
+        Nav::Up(levels) => String::from("*↑") + &superscript(levels),
+        Nav::UpSkipTrivia(levels) => String::from("~↑") + &superscript(levels),
+        Nav::UpExact(levels) => String::from(".↑") + &superscript(levels),
+    }
+}
+
+/// Render `n` in Unicode superscript digits (e.g. `12` becomes `¹²`).
+fn superscript(n: u8) -> String {
+    const DIGITS: [char; 10] = ['⁰', '¹', '²', '³', '⁴', '⁵', '⁶', '⁷', '⁸', '⁹'];
+    // Translate each decimal digit; single-digit values need no special case.
+    let decimal = n.to_string();
+    let mut rendered = String::with_capacity(decimal.len() * 3);
+    for digit in decimal.bytes() {
+        rendered.push(DIGITS[usize::from(digit - b'0')]);
+    }
+    rendered
+}
+
+fn format_effect(effect: &super::EffectOp) -> String {
+    match effect.opcode { // payload-free opcodes print as their bare name
+        EffectOpcode::Node => "Node".to_string(),
+        EffectOpcode::A => "A".to_string(),
+        EffectOpcode::Push => "Push".to_string(),
+        EffectOpcode::EndA => "EndA".to_string(),
+        EffectOpcode::S => "S".to_string(),
+        EffectOpcode::EndS => "EndS".to_string(),
+        EffectOpcode::Set => format!("Set(M{})", effect.payload), // payload shown with the `M` prefix
+        EffectOpcode::E => format!("E(M{})", effect.payload), // payload shown with the `M` prefix
+        EffectOpcode::EndE => "EndE".to_string(),
+        EffectOpcode::Text => "Text".to_string(),
+        EffectOpcode::Clear => "Clear".to_string(),
+        EffectOpcode::Null => "Null".to_string(),
+    }
+}
diff --git a/crates/plotnik-lib/src/bytecode/header.rs b/crates/plotnik-lib/src/bytecode/header.rs
index 988fe535..8b9686df 100644
--- a/crates/plotnik-lib/src/bytecode/header.rs
+++ b/crates/plotnik-lib/src/bytecode/header.rs
@@ -2,6 +2,13 @@
 
 use super::{MAGIC, VERSION};
 
+/// Bit masks for the header's `flags` field.
+pub mod flags {
+    /// Bit 0 set: bytecode is linked (instructions contain NodeTypeId/NodeFieldId).
+    /// Bit 0 clear: bytecode is unlinked (instructions contain StringId references).
+    pub const LINKED: u16 = 0x0001;
+}
+
 /// File header - first 64 bytes of the bytecode file.
 ///
 /// Note: TypeMeta sub-section counts are stored in the TypeMetaHeader,
@@ -35,8 +42,10 @@ pub struct Header {
     pub trivia_count: u16,
     pub entrypoints_count: u16,
     pub transitions_count: u16,
+    /// Header flags (see `flags` module for bit definitions).
+    pub flags: u16,
     /// Padding to maintain 64-byte size.
-    pub(crate) _pad: u32,
+    pub(crate) _pad: u16,
 }
 
 const _: () = assert!(std::mem::size_of::<Header>() == 64);
@@ -62,6 +71,7 @@ impl Default for Header {
             trivia_count: 0,
             entrypoints_count: 0,
             transitions_count: 0,
+            flags: 0,
             _pad: 0,
         }
     }
@@ -91,7 +101,8 @@ impl Header {
             trivia_count: u16::from_le_bytes([bytes[54], bytes[55]]),
             entrypoints_count: u16::from_le_bytes([bytes[56], bytes[57]]),
             transitions_count: u16::from_le_bytes([bytes[58], bytes[59]]),
-            _pad: u32::from_le_bytes([bytes[60], bytes[61], bytes[62], bytes[63]]),
+            flags: u16::from_le_bytes([bytes[60], bytes[61]]),
+            _pad: u16::from_le_bytes([bytes[62], bytes[63]]),
         }
     }
 
@@ -116,7 +127,8 @@ impl Header {
         bytes[54..56].copy_from_slice(&self.trivia_count.to_le_bytes());
         bytes[56..58].copy_from_slice(&self.entrypoints_count.to_le_bytes());
         bytes[58..60].copy_from_slice(&self.transitions_count.to_le_bytes());
-        bytes[60..64].copy_from_slice(&self._pad.to_le_bytes());
+        bytes[60..62].copy_from_slice(&self.flags.to_le_bytes());
+        bytes[62..64].copy_from_slice(&self._pad.to_le_bytes());
         bytes
     }
 
@@ -127,6 +139,20 @@ impl Header {
     pub fn validate_version(&self) -> bool {
         self.version == VERSION
     }
+
+    /// Whether the `LINKED` flag bit is set (bytecode contains resolved grammar IDs).
+    pub fn is_linked(&self) -> bool {
+        (self.flags & flags::LINKED) == flags::LINKED
+    }
+
+    /// Set or clear the `LINKED` bit; every other flag bit is left untouched.
+    pub fn set_linked(&mut self, linked: bool) {
+        // Clear the bit unconditionally, then re-set it only when requested.
+        self.flags &= !flags::LINKED;
+        if linked {
+            self.flags |= flags::LINKED;
+        }
+    }
 }
 
 #[cfg(test)]
@@ -176,4 +202,30 @@ mod tests {
         let decoded = Header::from_bytes(&bytes);
         assert_eq!(decoded, h);
     }
+
+    #[test]
+    fn header_linked_flag() {
+        let mut header = Header::default();
+        assert!(!header.is_linked());
+        // Setting the flag raises exactly the LINKED bit.
+        header.set_linked(true);
+        assert!(header.is_linked());
+        assert_eq!(header.flags, flags::LINKED);
+        // Clearing it returns the field to zero.
+        header.set_linked(false);
+        assert!(!header.is_linked());
+        assert_eq!(header.flags, 0);
+    }
+
+    #[test]
+    fn header_flags_roundtrip() {
+        let mut original = Header::default();
+        original.set_linked(true);
+        // Serialize and parse back; the flag must survive the byte encoding.
+        let decoded = Header::from_bytes(&original.to_bytes());
+        let expected_flags = flags::LINKED;
+
+        assert!(decoded.is_linked());
+        assert_eq!(decoded.flags, expected_flags);
+    }
 }
diff --git a/crates/plotnik-lib/src/bytecode/ir.rs b/crates/plotnik-lib/src/bytecode/ir.rs
new file mode 100644
index 00000000..e42485dc
--- /dev/null
+++ b/crates/plotnik-lib/src/bytecode/ir.rs
@@ -0,0 +1,315 @@
+//! Instruction IR with symbolic labels.
+//!
+//! Pre-layout instructions use `Label` for symbolic references.
+//! After layout, labels are resolved to `StepId` for serialization.
+
+use std::collections::BTreeMap;
+use std::num::NonZeroU16;
+
+use super::effects::EffectOp;
+use super::ids::StepId;
+use super::instructions::{Call, Match, Return, select_match_opcode};
+use super::nav::Nav;
+
+/// Symbolic instruction address; layout later maps it to a concrete `StepId`.
+#[derive(Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash, Debug)]
+pub struct Label(pub u32);
+
+impl Label {
+    /// Sentinel for terminal (accept) state.
+    pub const ACCEPT: Label = Label(u32::MAX);
+
+    /// Whether this label is the `ACCEPT` sentinel.
+    #[inline]
+    pub fn is_accept(self) -> bool {
+        self == Self::ACCEPT
+    }
+
+    /// Look this label up in `map`. The accept sentinel, and any label missing
+    /// from `map`, resolves to `StepId::ACCEPT`.
+    #[inline]
+    pub fn resolve(self, map: &BTreeMap<Label, StepId>) -> StepId {
+        let known = map.get(&self).filter(|_| !self.is_accept());
+        known.copied().unwrap_or(StepId::ACCEPT)
+    }
+}
+
+/// Pre-layout instruction with symbolic references.
+#[derive(Clone, Debug)]
+pub enum Instruction {
+    Match(MatchIR),
+    Call(CallIR),
+    Return(ReturnIR),
+}
+
+impl Instruction {
+    /// Label identifying this instruction's own position.
+    #[inline]
+    pub fn label(&self) -> Label {
+        match self {
+            Instruction::Match(matcher) => matcher.label,
+            Instruction::Call(call) => call.label,
+            Instruction::Return(ret) => ret.label,
+        }
+    }
+
+    /// Encoded size in bytes: calls and returns are 8, matches vary (see `MatchIR::size`).
+    pub fn size(&self) -> usize {
+        match self {
+            Instruction::Call(_) | Instruction::Return(_) => 8,
+            Instruction::Match(matcher) => matcher.size(),
+        }
+    }
+
+    /// Successor labels for graph building; a call contributes `next` only, not `target`.
+    pub fn successors(&self) -> Vec<Label> {
+        match self {
+            Instruction::Match(matcher) => matcher.successors.to_vec(),
+            Instruction::Call(call) => Vec::from([call.next]),
+            Instruction::Return(_) => Vec::new(),
+        }
+    }
+
+    /// Resolve labels through `map` and serialize to bytecode bytes.
+    pub fn resolve(&self, map: &BTreeMap<Label, StepId>) -> Vec<u8> {
+        match self {
+            Instruction::Match(matcher) => matcher.resolve(map),
+            Instruction::Call(call) => Vec::from(call.resolve(map)),
+            Instruction::Return(ret) => Vec::from(ret.resolve()),
+        }
+    }
+}
+
+/// Match instruction IR with symbolic successors.
+#[derive(Clone, Debug)]
+pub struct MatchIR {
+    /// Where this instruction lives.
+    pub label: Label,
+    /// Navigation command.
+    pub nav: Nav,
+    /// Node type constraint (None = wildcard).
+    pub node_type: Option<NonZeroU16>,
+    /// Field constraint (None = wildcard).
+    pub node_field: Option<NonZeroU16>,
+    /// Effects to execute before match attempt.
+    pub pre_effects: Vec<EffectOp>,
+    /// Fields that must NOT be present on the node.
+    pub neg_fields: Vec<u16>,
+    /// Effects to execute after successful match.
+    pub post_effects: Vec<EffectOp>,
+    /// Successor labels (empty = accept, 1 = linear, 2+ = branch).
+    pub successors: Vec<Label>,
+}
+
+impl MatchIR {
+    /// Encoded size in bytes.
+    ///
+    /// A match with no effects, no negated fields and at most one successor
+    /// uses the 8-byte form. Otherwise the opcode is selected from the total
+    /// payload slot count, falling back to 64 bytes when none is selected.
+    ///
+    /// NOTE(review): the fallback presumably covers slot counts too large for
+    /// any opcode, which `resolve` would then reject - confirm.
+    pub fn size(&self) -> usize {
+        let extras = self.pre_effects.len() + self.neg_fields.len() + self.post_effects.len();
+        let successors = self.successors.len();
+
+        // Match8: nothing to encode beyond an optional single successor.
+        if extras == 0 && successors <= 1 {
+            return 8;
+        }
+
+        // Extended match: every effect, negated field and successor is a slot.
+        let slots = extras + successors;
+        select_match_opcode(slots).map_or(64, |op| op.size())
+    }
+
+    /// Resolve successor labels through `map` and serialize to bytecode bytes.
+    ///
+    /// # Panics
+    ///
+    /// Panics with "instruction too large" if `Match::to_bytes` fails.
+    pub fn resolve(&self, map: &BTreeMap<Label, StepId>) -> Vec<u8> {
+        let resolved = Match {
+            segment: 0,
+            nav: self.nav,
+            node_type: self.node_type,
+            node_field: self.node_field,
+            pre_effects: self.pre_effects.clone(),
+            neg_fields: self.neg_fields.clone(),
+            post_effects: self.post_effects.clone(),
+            successors: self.successors.iter().map(|label| label.resolve(map)).collect(),
+        };
+        resolved.to_bytes().expect("instruction too large")
+    }
+
+    /// True when navigation is `Nav::Stay` and no type or field constraint is set.
+    #[inline]
+    pub fn is_epsilon(&self) -> bool {
+        matches!((self.nav, self.node_type, self.node_field), (Nav::Stay, None, None))
+    }
+}
+
+/// Call instruction IR with symbolic target.
+#[derive(Clone, Debug)]
+pub struct CallIR {
+    /// Where this instruction lives.
+    pub label: Label,
+    /// Return address (where to continue after callee returns).
+    pub next: Label,
+    /// Callee entry point.
+    pub target: Label,
+    /// Definition identifier for stack validation.
+    pub ref_id: u16,
+}
+
+impl CallIR {
+    /// Resolve `next` and `target` through `map`, then encode the 8-byte call.
+    pub fn resolve(&self, map: &BTreeMap<Label, StepId>) -> [u8; 8] {
+        Call {
+            segment: 0,
+            next: self.next.resolve(map),
+            target: self.target.resolve(map),
+            ref_id: self.ref_id,
+        }
+        .to_bytes()
+    }
+}
+
+/// Return instruction IR.
+#[derive(Clone, Debug)]
+pub struct ReturnIR {
+    /// Where this instruction lives.
+    pub label: Label,
+    /// Definition identifier for stack validation.
+    pub ref_id: u16,
+}
+
+impl ReturnIR {
+    /// Encode the 8-byte return instruction. Nothing needs resolving: a
+    /// return carries only its `ref_id`, no labels.
+    pub fn resolve(&self) -> [u8; 8] {
+        Return {
+            segment: 0,
+            ref_id: self.ref_id,
+        }
+        .to_bytes()
+    }
+}
+
+/// Result of layout: the label-to-step mapping plus the total step count.
+#[derive(Clone, Debug)]
+pub struct LayoutResult {
+    /// Concrete `StepId` assigned to each symbolic label.
+    pub label_to_step: BTreeMap<Label, StepId>,
+    /// Total number of steps (for header).
+    pub total_steps: u16,
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn label_accept_sentinel() {
+        assert!(Label::ACCEPT.is_accept());
+        assert!(!Label(0).is_accept());
+        assert!(!Label(100).is_accept());
+    }
+
+    #[test]
+    fn match_ir_size_match8() {
+        let m = MatchIR {
+            label: Label(0),
+            nav: Nav::Down,
+            node_type: NonZeroU16::new(10),
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label(1)],
+        };
+
+        assert_eq!(m.size(), 8); // no effects, one successor: compact 8-byte form
+    }
+
+    #[test]
+    fn match_ir_size_extended() {
+        let m = MatchIR {
+            label: Label(0),
+            nav: Nav::Down,
+            node_type: NonZeroU16::new(10),
+            node_field: None,
+            pre_effects: vec![EffectOp {
+                opcode: super::super::effects::EffectOpcode::S,
+                payload: 0,
+            }],
+            neg_fields: vec![],
+            post_effects: vec![EffectOp {
+                opcode: super::super::effects::EffectOpcode::Node,
+                payload: 0,
+            }],
+            successors: vec![Label(1)],
+        };
+
+        // 3 payload slots (1 pre-effect + 1 post-effect + 1 successor) fit in Match16 (4 slots)
+        assert_eq!(m.size(), 16);
+    }
+
+    #[test]
+    fn instruction_successors() {
+        let m = Instruction::Match(MatchIR {
+            label: Label(0),
+            nav: Nav::Stay,
+            node_type: None,
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label(1), Label(2)],
+        });
+
+        assert_eq!(m.successors(), vec![Label(1), Label(2)]);
+
+        let c = Instruction::Call(CallIR {
+            label: Label(3),
+            next: Label(4),
+            target: Label(5),
+            ref_id: 0,
+        });
+
+        assert_eq!(c.successors(), vec![Label(4)]); // `next` only; `target` is not a successor
+
+        let r = Instruction::Return(ReturnIR {
+            label: Label(6),
+            ref_id: 0,
+        });
+
+        assert!(r.successors().is_empty());
+    }
+
+    #[test]
+    fn resolve_match_with_accept() {
+        let m = MatchIR {
+            label: Label(0),
+            nav: Nav::Stay,
+            node_type: None,
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label::ACCEPT],
+        };
+
+        let mut map = BTreeMap::new();
+        map.insert(Label(0), StepId(1)); // unrelated entry: ACCEPT resolves without the map
+
+        let bytes = m.resolve(&map);
+        assert_eq!(bytes.len(), 8);
+
+        // Low nibble of byte 0 is checked as the opcode; Match8 is 0x0
+        assert_eq!(bytes[0] & 0xF, 0);
+        // Bytes 6-7 (little-endian) are checked as the successor; ACCEPT is 0
+        assert_eq!(u16::from_le_bytes([bytes[6], bytes[7]]), 0);
+    }
+}
diff --git a/crates/plotnik-lib/src/bytecode/layout.rs b/crates/plotnik-lib/src/bytecode/layout.rs
new file mode 100644
index 00000000..acadf972
--- /dev/null
+++ b/crates/plotnik-lib/src/bytecode/layout.rs
@@ -0,0 +1,184 @@
+//! Cache-aligned instruction layout.
+//!
+//! Uses Pettis-Hansen inspired greedy chain extraction to place
+//! hot paths contiguously and avoid cache line straddling.
+
+use std::collections::{BTreeMap, HashSet};
+
+use super::ids::StepId;
+use super::ir::{Instruction, Label, LayoutResult};
+
+const CACHE_LINE: usize = 64; // Bytes per cache line; large instructions must not straddle one.
+const STEP_SIZE: usize = 8; // Bytes per step; byte sizes are divided by this to get step counts.
+
+/// Successor graph for layout analysis; edges into ACCEPT are left out when it is built.
+struct Graph {
+    /// label -> list of successor labels (every instruction label has an entry, possibly empty)
+    successors: BTreeMap<Label, Vec<Label>>,
+    /// label -> list of predecessor labels (labels without predecessors have no entry)
+    predecessors: BTreeMap<Label, Vec<Label>>,
+}
+
+impl Graph {
+    /// Collect the non-ACCEPT edges of every instruction into both adjacency maps.
+    fn build(instructions: &[Instruction]) -> Self {
+        let mut graph = Self {
+            successors: BTreeMap::new(),
+            predecessors: BTreeMap::new(),
+        };
+
+        for instr in instructions {
+            let from = instr.label();
+            // Create the entry up front so instructions without edges are still recorded.
+            let outgoing = graph.successors.entry(from).or_default();
+
+            for to in instr.successors().into_iter().filter(|to| !to.is_accept()) {
+                outgoing.push(to);
+                graph.predecessors.entry(to).or_default().push(from);
+            }
+        }
+
+        graph
+    }
+
+    /// Outgoing edges of `label`, or an empty slice when the label is unknown.
+    fn successors(&self, label: Label) -> &[Label] {
+        self.successors.get(&label).map(Vec::as_slice).unwrap_or_default()
+    }
+
+    /// Number of incoming edges of `label` (zero when none were recorded).
+    fn predecessor_count(&self, label: Label) -> usize {
+        self.predecessors.get(&label).map_or(0, Vec::len)
+    }
+}
+
+/// Layout strategy that keeps chains contiguous and large instructions inside one cache line.
+pub struct CacheAligned;
+
+impl CacheAligned {
+    /// Lay out `instructions`, placing chains that start at `entries` first.
+    ///
+    /// Returns the label-to-step mapping (ACCEPT included) and the total step count.
+    pub fn layout(instructions: &[Instruction], entries: &[Label]) -> LayoutResult {
+        if instructions.is_empty() {
+            // Nothing to place: only the reserved ACCEPT step exists.
+            let label_to_step = BTreeMap::from([(Label::ACCEPT, StepId::ACCEPT)]);
+            let total_steps = 1;
+            return LayoutResult { label_to_step, total_steps };
+        }
+
+        let by_label: BTreeMap<Label, &Instruction> = instructions
+            .iter()
+            .map(|instr| (instr.label(), instr))
+            .collect();
+        let graph = Graph::build(instructions);
+        let chains = order_chains(extract_chains(&graph, instructions, entries), entries);
+
+        assign_step_ids(chains, &by_label)
+    }
+}
+
+/// Partition the graph into linear chains, seeding from `entries` before anything else.
+///
+/// Each label is placed in at most one chain; an entry label still seeds a chain even if
+/// no instruction carries it.
+fn extract_chains(graph: &Graph, instructions: &[Instruction], entries: &[Label]) -> Vec<Vec<Label>> {
+    let mut seen = HashSet::new();
+    let mut chains = Vec::new();
+
+    // Entry points seed first (hot paths), then every instruction in input order.
+    let seeds = entries
+        .iter()
+        .copied()
+        .chain(instructions.iter().map(|instr| instr.label()));
+
+    for seed in seeds {
+        // A label already absorbed into an earlier chain must not start a new one,
+        // so only labels that are still unseen become chain heads.
+        if !seen.contains(&seed) {
+            chains.push(build_chain(seed, graph, &mut seen));
+        }
+    }
+
+    chains
+}
+
+/// Grow a chain from `start`, marking every label it absorbs as visited.
+///
+/// Follows `tail -> next` only while `next` is the sole successor, unvisited, and has one predecessor.
+fn build_chain(start: Label, graph: &Graph, visited: &mut HashSet<Label>) -> Vec<Label> {
+    visited.insert(start);
+    let mut chain = vec![start];
+    let mut tail = start;
+
+    while let &[next] = graph.successors(tail) {
+        if visited.contains(&next) || graph.predecessor_count(next) != 1 {
+            break;
+        }
+        visited.insert(next);
+        chain.push(next);
+        tail = next;
+    }
+
+    chain
+}
+
+/// Put chains that begin at an entry label first, then the rest from longest to shortest.
+fn order_chains(chains: Vec<Vec<Label>>, entries: &[Label]) -> Vec<Vec<Label>> {
+    let entry_labels: HashSet<Label> = entries.iter().copied().collect();
+    let starts_at_entry =
+        |chain: &Vec<Label>| chain.first().is_some_and(|head| entry_labels.contains(head));
+
+    // Entry-headed chains keep their relative order; the others are split off for sorting.
+    let (mut ordered, mut rest): (Vec<_>, Vec<_>) = chains.into_iter().partition(starts_at_entry);
+
+    // Stable sort by descending length (longer chains are assumed to be hotter).
+    rest.sort_by(|a, b| b.len().cmp(&a.len()));
+
+    // Entry chains lead; everything else follows.
+    ordered.extend(rest);
+    ordered
+}
+
+/// Assign step IDs chain by chain, padding so large instructions do not straddle a cache line.
+///
+/// Step 0 is reserved for ACCEPT, so placement starts at step 1. Labels without a matching
+/// instruction are skipped. Byte positions are derived from the step index (`step * STEP_SIZE`)
+/// so that the alignment check accounts for the reserved ACCEPT slot.
+fn assign_step_ids(
+    chains: Vec<Vec<Label>>,
+    label_to_instr: &BTreeMap<Label, &Instruction>,
+) -> LayoutResult {
+    let mut mapping = BTreeMap::new();
+    mapping.insert(Label::ACCEPT, StepId::ACCEPT);
+
+    let mut current_step = 1u16; // 0 is ACCEPT
+
+    for chain in chains {
+        for label in chain {
+            let Some(instr) = label_to_instr.get(&label) else {
+                continue;
+            };
+            let size = instr.size();
+
+            // Only instructions of 48 bytes or more are kept inside a single cache line.
+            if size >= 48 {
+                // Derive the byte position from the step index so the two can never disagree.
+                let line_offset = (usize::from(current_step) * STEP_SIZE) % CACHE_LINE;
+                if line_offset + size > CACHE_LINE {
+                    // Would straddle a cache line: skip ahead to the start of the next one.
+                    let padding_bytes = CACHE_LINE - line_offset;
+                    current_step += (padding_bytes / STEP_SIZE) as u16;
+                }
+            }
+
+            mapping.insert(label, StepId(current_step));
+            current_step += (size / STEP_SIZE) as u16;
+        }
+    }
+
+    LayoutResult {
+        label_to_step: mapping,
+        total_steps: current_step,
+    }
+}
diff --git a/crates/plotnik-lib/src/bytecode/layout_tests.rs b/crates/plotnik-lib/src/bytecode/layout_tests.rs
new file mode 100644
index 00000000..d2e4543f
--- /dev/null
+++ b/crates/plotnik-lib/src/bytecode/layout_tests.rs
@@ -0,0 +1,243 @@
+use std::num::NonZeroU16;
+
+use super::ids::StepId;
+use super::ir::{CallIR, Instruction, Label, MatchIR, ReturnIR};
+use super::layout::CacheAligned;
+use crate::bytecode::effects::{EffectOp, EffectOpcode};
+use crate::bytecode::nav::Nav;
+
+#[test]
+fn layout_empty() {
+    // With no instructions, only the reserved ACCEPT step is laid out.
+    let layout = CacheAligned::layout(&[], &[]);
+    assert_eq!(layout.label_to_step.get(&Label::ACCEPT), Some(&StepId::ACCEPT));
+    assert_eq!(layout.total_steps, 1);
+}
+
+#[test]
+fn layout_single_instruction() {
+    let only = Instruction::Match(MatchIR {
+        label: Label(0),
+        nav: Nav::Down,
+        node_type: NonZeroU16::new(10),
+        node_field: None,
+        pre_effects: vec![],
+        neg_fields: vec![],
+        post_effects: vec![],
+        successors: vec![Label::ACCEPT],
+    });
+    let layout = CacheAligned::layout(&[only], &[Label(0)]);
+    // The lone instruction lands right after the reserved ACCEPT step.
+    assert_eq!(layout.label_to_step.get(&Label(0)), Some(&StepId(1)));
+    // Reserved step 0 plus one step for the instruction.
+    assert_eq!(layout.total_steps, 2);
+}
+
+#[test]
+fn layout_linear_chain() {
+    // Straight line: Label(0) -> Label(1) -> Label(2) -> ACCEPT
+    let program = [
+        Instruction::Match(MatchIR {
+            label: Label(0),
+            nav: Nav::Down,
+            node_type: NonZeroU16::new(10),
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label(1)],
+        }),
+        Instruction::Match(MatchIR {
+            label: Label(1),
+            nav: Nav::Next,
+            node_type: NonZeroU16::new(20),
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label(2)],
+        }),
+        Instruction::Match(MatchIR {
+            label: Label(2),
+            nav: Nav::Up(1),
+            node_type: None,
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label::ACCEPT],
+        }),
+    ];
+    let layout = CacheAligned::layout(&program, &[Label(0)]);
+
+    // A single chain is laid out back to back, starting right after ACCEPT.
+    let expected = [(Label(0), StepId(1)), (Label(1), StepId(2)), (Label(2), StepId(3))];
+    for (label, step) in expected {
+        assert_eq!(layout.label_to_step.get(&label), Some(&step));
+    }
+}
+
+#[test]
+fn layout_call_return() {
+    // Caller: 0 -> Call@1 (resumes at 3) -> ACCEPT. Callee: 2 -> Return@4.
+    let program = [
+        Instruction::Match(MatchIR {
+            label: Label(0),
+            nav: Nav::Down,
+            node_type: NonZeroU16::new(10),
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label(1)],
+        }),
+        Instruction::Call(CallIR {
+            label: Label(1),
+            next: Label(3),
+            target: Label(2),
+            ref_id: 0,
+        }),
+        Instruction::Match(MatchIR {
+            label: Label(2),
+            nav: Nav::Down,
+            node_type: NonZeroU16::new(20),
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label(4)],
+        }),
+        Instruction::Match(MatchIR {
+            label: Label(3),
+            nav: Nav::Up(1),
+            node_type: None,
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label::ACCEPT],
+        }),
+        Instruction::Return(ReturnIR {
+            label: Label(4),
+            ref_id: 0,
+        }),
+    ];
+    let entries = [Label(0)];
+    let layout = CacheAligned::layout(&program, &entries);
+
+    // Every instruction must receive a step, including the callee body (labels 2 and 4),
+    // which this fixture references only through the call's `target`.
+    let all_labels = [Label(0), Label(1), Label(2), Label(3), Label(4)];
+    for label in all_labels {
+        assert!(layout.label_to_step.contains_key(&label));
+    }
+}
+
+#[test]
+fn layout_branch() {
+    // Label(0) forks to Label(1) and Label(2); both arms end in ACCEPT.
+    let program = [
+        Instruction::Match(MatchIR {
+            label: Label(0),
+            nav: Nav::Stay,
+            node_type: None,
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label(1), Label(2)],
+        }),
+        Instruction::Match(MatchIR {
+            label: Label(1),
+            nav: Nav::Down,
+            node_type: NonZeroU16::new(10),
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label::ACCEPT],
+        }),
+        Instruction::Match(MatchIR {
+            label: Label(2),
+            nav: Nav::Down,
+            node_type: NonZeroU16::new(20),
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label::ACCEPT],
+        }),
+    ];
+    let layout = CacheAligned::layout(&program, &[Label(0)]);
+
+    // Look up where the fork and each arm were placed (panics if one is missing).
+    let fork = &layout.label_to_step[&Label(0)];
+    let left = &layout.label_to_step[&Label(1)];
+    let right = &layout.label_to_step[&Label(2)];
+
+    // All three must occupy pairwise distinct steps.
+    assert_ne!(fork, left);
+    assert_ne!(left, right);
+    assert_ne!(fork, right);
+}
+
+#[test]
+fn layout_large_instruction_cache_alignment() {
+    // Fixture: one small match (label 0) chained directly into a large match (label 1).
+    // NOTE(review): with a single small predecessor the large match may not need padding.
+    let wide = MatchIR {
+        label: Label(1),
+        nav: Nav::Down,
+        node_type: NonZeroU16::new(10),
+        node_field: None,
+        pre_effects: vec![
+            EffectOp { opcode: EffectOpcode::S, payload: 0 },
+            EffectOp { opcode: EffectOpcode::S, payload: 0 },
+            EffectOp { opcode: EffectOpcode::S, payload: 0 },
+        ],
+        neg_fields: vec![],
+        post_effects: vec![
+            EffectOp { opcode: EffectOpcode::Node, payload: 0 },
+            EffectOp { opcode: EffectOpcode::EndS, payload: 0 },
+            EffectOp { opcode: EffectOpcode::EndS, payload: 0 },
+            EffectOp { opcode: EffectOpcode::EndS, payload: 0 },
+        ],
+        successors: vec![
+            Label::ACCEPT,
+            Label::ACCEPT,
+            Label::ACCEPT,
+            Label::ACCEPT,
+            Label::ACCEPT,
+            Label::ACCEPT,
+            Label::ACCEPT,
+            Label::ACCEPT,
+        ],
+    };
+
+    // Guard the fixture: it must reach the size at which the layout applies alignment.
+    assert!(wide.size() >= 48);
+
+    let program = [
+        // One small instruction ahead of the large one, so it is not the first step placed.
+        Instruction::Match(MatchIR {
+            label: Label(0),
+            nav: Nav::Stay,
+            node_type: None,
+            node_field: None,
+            pre_effects: vec![],
+            neg_fields: vec![],
+            post_effects: vec![],
+            successors: vec![Label(1)],
+        }),
+        Instruction::Match(wide),
+    ];
+
+    let layout = CacheAligned::layout(&program, &[Label(0)]);
+
+    // The entry instruction takes the first step after the reserved ACCEPT step.
+    assert_eq!(layout.label_to_step.get(&Label(0)), Some(&StepId(1)));
+
+    // The large match follows at step 2, or later if padding was inserted before it.
+    let wide_step = layout.label_to_step.get(&Label(1)).unwrap();
+    assert!(wide_step.0 >= 2);
+}
diff --git a/crates/plotnik-lib/src/bytecode/mod.rs b/crates/plotnik-lib/src/bytecode/mod.rs
index 9fd33cc9..e288c04a 100644
--- a/crates/plotnik-lib/src/bytecode/mod.rs
+++ b/crates/plotnik-lib/src/bytecode/mod.rs
@@ -3,12 +3,15 @@
 //! Implements the binary format specified in `docs/binary-format/`.
 
 mod constants;
+mod dump;
 mod effects;
 pub mod emit;
 mod entrypoint;
 mod header;
 mod ids;
 mod instructions;
+pub mod ir;
+pub mod layout;
 mod module;
 mod nav;
 mod sections;
@@ -21,7 +24,7 @@ pub use constants::{
 
 pub use ids::{QTypeId, StepId, StringId};
 
-pub use header::Header;
+pub use header::{flags, Header};
 
 pub use sections::{FieldSymbol, NodeSymbol, Slice, TriviaEntry};
 
@@ -42,7 +45,11 @@ pub use module::{
     SymbolsView, TriviaView, TypesView,
 };
 
+pub use dump::dump;
+
 #[cfg(test)]
 mod instructions_tests;
 #[cfg(test)]
+mod layout_tests;
+#[cfg(test)]
 mod module_tests;