From db4163bc7200de94e6a270022982458d08b0e4cf Mon Sep 17 00:00:00 2001
From: Sergei Zharinov <zharinov@users.noreply.github.com>
Date: Mon, 29 Dec 2025 15:06:35 -0300
Subject: [PATCH] feat: add bytecode instruction decoding

Add instruction types and serialization:
- Match8/16/24/32/48/64 variants for node type matching
- Call/Return for state machine transitions
- Opcode enum, plus from_bytes/to_bytes on each instruction type
---
 .../plotnik-lib/src/bytecode/instructions.rs  | 567 ++++++++++++++++++
 .../src/bytecode/instructions_tests.rs        | 267 +++++++++
 crates/plotnik-lib/src/bytecode/mod.rs        |   8 +
 3 files changed, 842 insertions(+)
 create mode 100644 crates/plotnik-lib/src/bytecode/instructions.rs
 create mode 100644 crates/plotnik-lib/src/bytecode/instructions_tests.rs
diff --git a/crates/plotnik-lib/src/bytecode/instructions.rs b/crates/plotnik-lib/src/bytecode/instructions.rs
new file mode 100644
index 00000000..c9dd6921
--- /dev/null
+++ b/crates/plotnik-lib/src/bytecode/instructions.rs
@@ -0,0 +1,567 @@
+//! Bytecode instruction definitions.
+//!
+//! Instructions are runtime-friendly structs with `from_bytes`/`to_bytes`
+//! methods for bytecode serialization.
+
+use std::num::NonZeroU16;
+
+use super::constants::{SECTION_ALIGN, STEP_SIZE};
+use super::effects::EffectOp;
+use super::ids::StepId;
+use super::nav::Nav;
+
+/// Decode `count` consecutive little-endian u16 values from `bytes`, beginning
+/// at `*offset`; `*offset` is moved forward by two bytes per value read.
+#[inline]
+fn read_u16_vec(bytes: &[u8], offset: &mut usize, count: usize) -> Vec<u16> {
+    let mut values = Vec::with_capacity(count);
+    for _ in 0..count {
+        let (lo, hi) = (bytes[*offset], bytes[*offset + 1]);
+        values.push(u16::from_le_bytes([lo, hi]));
+        *offset += 2;
+    }
+    values
+}
+
+/// Instruction opcodes, stored in the low 4 bits of an instruction's first byte.
+#[derive(Clone, Copy, PartialEq, Eq, Debug)]
+#[repr(u8)]
+pub enum Opcode {
+    Match8 = 0x0, // 8-byte match: no payload
+    Match16 = 0x1, // 16-byte match: 4 payload slots
+    Match24 = 0x2, // 24-byte match: 8 payload slots
+    Match32 = 0x3, // 32-byte match: 12 payload slots
+    Match48 = 0x4, // 48-byte match: 20 payload slots
+    Match64 = 0x5, // 64-byte match: 28 payload slots
+    Call = 0x6, // 8-byte call instruction
+    Return = 0x7, // 8-byte return instruction
+}
+
+impl Opcode {
+    /// Map an opcode value (the low nibble of a type ID byte) to its variant.
+    ///
+    /// # Panics
+    ///
+    /// Panics with `invalid opcode: {v}` when `v` is outside `0x0..=0x7`.
+    pub fn from_u8(v: u8) -> Self {
+        const BY_VALUE: [Opcode; 8] = [
+            Opcode::Match8,
+            Opcode::Match16,
+            Opcode::Match24,
+            Opcode::Match32,
+            Opcode::Match48,
+            Opcode::Match64,
+            Opcode::Call,
+            Opcode::Return,
+        ];
+        match BY_VALUE.get(usize::from(v)) {
+            Some(&opcode) => opcode,
+            None => panic!("invalid opcode: {v}"),
+        }
+    }
+
+    /// Total encoded length of the instruction, in bytes.
+    ///
+    /// `Match8`, `Call` and `Return` take 8 bytes; `MatchN` takes `N` bytes.
+    pub fn size(self) -> usize {
+        match self {
+            Self::Match8 | Self::Call | Self::Return => 8,
+            Self::Match16 => 16,
+            Self::Match24 => 24,
+            Self::Match32 => 32,
+            Self::Match48 => 48,
+            Self::Match64 => 64,
+        }
+    }
+
+    /// Number of steps this instruction occupies.
+    ///
+    /// Computed as `size() / STEP_SIZE` and cast to `u16`.
+    pub fn step_count(self) -> u16 {
+        let steps = self.size() / STEP_SIZE;
+        steps as u16
+    }
+
+    /// True for every `Match*` variant, false for `Call` and `Return`.
+    pub fn is_match(self) -> bool {
+        !matches!(self, Self::Call | Self::Return)
+    }
+
+    /// True for the payload-carrying variants `Match16` through `Match64`.
+    pub fn is_extended_match(self) -> bool {
+        self.is_match() && self != Self::Match8
+    }
+
+    /// Payload capacity in u16 slots.
+    ///
+    /// Extended Match variants hold `(size - 8) / 2` slots after the 8-byte
+    /// header; every other opcode reports 0.
+    pub fn payload_slots(self) -> usize {
+        if self.is_extended_match() {
+            (self.size() - 8) / 2
+        } else {
+            0
+        }
+    }
+}
+
+/// Match instruction for pattern matching in the VM.
+///
+/// Unifies Match8 (fast-path) and Match16-64 (extended) wire formats into
+/// a single runtime-friendly struct.
+#[derive(Clone, PartialEq, Eq, Debug)]
+pub struct Match {
+    /// Segment index (0-15, high nibble of byte 0); decoding currently requires 0.
+    pub segment: u8,
+    /// Navigation command, encoded as the single byte at offset 1.
+    pub nav: Nav,
+    /// Node type constraint (None = wildcard, encoded as 0).
+    pub node_type: Option<NonZeroU16>,
+    /// Field constraint (None = wildcard, encoded as 0).
+    pub node_field: Option<NonZeroU16>,
+    /// Effects to execute before match attempt (wire count is 3 bits wide).
+    pub pre_effects: Vec<EffectOp>,
+    /// Fields that must NOT be present on the node (wire count is 3 bits wide).
+    pub neg_fields: Vec<u16>,
+    /// Effects to execute after successful match (wire count is 3 bits wide).
+    pub post_effects: Vec<EffectOp>,
+    /// Successor step IDs (empty = accept, 1 = linear, 2+ = branch; 6-bit wire count).
+    pub successors: Vec<StepId>,
+}
+
+impl Match {
+    /// Check if this is a terminal (accept) state, i.e. it has no successors.
+    #[inline]
+    pub fn is_terminal(&self) -> bool {
+        self.successors.is_empty()
+    }
+
+    /// Check if this is an epsilon transition (no node interaction).
+    #[inline]
+    pub fn is_epsilon(&self) -> bool {
+        self.nav == Nav::Stay && self.node_type.is_none() && self.node_field.is_none()
+    }
+
+    /// Decode from bytecode bytes.
+    ///
+    /// The slice must start at the instruction and contain at least
+    /// the full instruction size (determined by opcode).
+    ///
+    /// # Panics
+    ///
+    /// Panics if the slice is shorter than the instruction, the segment is
+    /// non-zero, the opcode is not a Match variant, or the counts of an
+    /// extended match describe more payload slots than the opcode provides.
+    pub fn from_bytes(bytes: &[u8]) -> Self {
+        assert!(bytes.len() >= 8, "Match instruction too short");
+
+        let type_id_byte = bytes[0];
+        let segment = type_id_byte >> 4;
+        assert!(
+            segment == 0,
+            "non-zero segment not yet supported: {segment}"
+        );
+        let opcode = Opcode::from_u8(type_id_byte & 0xF);
+
+        assert!(opcode.is_match(), "expected Match opcode, got {opcode:?}");
+        assert!(
+            bytes.len() >= opcode.size(),
+            "Match instruction truncated: expected {} bytes, got {}",
+            opcode.size(),
+            bytes.len()
+        );
+
+        let nav = Nav::from_byte(bytes[1]);
+        let node_type = NonZeroU16::new(u16::from_le_bytes([bytes[2], bytes[3]]));
+        let node_field = NonZeroU16::new(u16::from_le_bytes([bytes[4], bytes[5]]));
+        let tail = u16::from_le_bytes([bytes[6], bytes[7]]);
+
+        let (pre_effects, neg_fields, post_effects, successors) = if opcode == Opcode::Match8 {
+            // Match8: bytes 6-7 hold the single successor; no payload follows.
+            let next = StepId(tail);
+            let successors = if next.is_accept() { vec![] } else { vec![next] };
+            (vec![], vec![], vec![], successors)
+        } else {
+            // Extended match: bytes 6-7 hold packed counts (3/3/3/6 bits, bit 0 unused).
+            let pre_count = usize::from((tail >> 13) & 0x7);
+            let neg_count = usize::from((tail >> 10) & 0x7);
+            let post_count = usize::from((tail >> 7) & 0x7);
+            let succ_count = usize::from((tail >> 1) & 0x3F);
+
+            // Reject counts that would read past this instruction's own payload.
+            let slots_used = pre_count + neg_count + post_count + succ_count;
+            assert!(
+                slots_used <= opcode.payload_slots(),
+                "Match payload overflow: {slots_used} slots used, {} available",
+                opcode.payload_slots()
+            );
+
+            let payload = &bytes[8..opcode.size()];
+            let mut offset = 0;
+            let pre_effects = read_u16_vec(payload, &mut offset, pre_count)
+                .into_iter()
+                .map(|v| EffectOp::from_bytes(v.to_le_bytes()))
+                .collect();
+            let neg_fields = read_u16_vec(payload, &mut offset, neg_count);
+            let post_effects = read_u16_vec(payload, &mut offset, post_count)
+                .into_iter()
+                .map(|v| EffectOp::from_bytes(v.to_le_bytes()))
+                .collect();
+            let successors = read_u16_vec(payload, &mut offset, succ_count)
+                .into_iter()
+                .map(StepId)
+                .collect();
+            (pre_effects, neg_fields, post_effects, successors)
+        };
+
+        Self {
+            segment,
+            nav,
+            node_type,
+            node_field,
+            pre_effects,
+            neg_fields,
+            post_effects,
+            successors,
+        }
+    }
+
+    /// Encode to bytecode bytes.
+    ///
+    /// Automatically selects the smallest opcode that fits the payload.
+    /// Returns None if the instruction cannot be represented: more than
+    /// 28 u16 payload slots in total, or more than 7 pre-effects, negated
+    /// fields or post-effects (their counts are 3-bit fields).
+    pub fn to_bytes(&self) -> Option<Vec<u8>> {
+        // Match8 can be used if: no effects, no neg_fields, and at most 1 successor
+        let can_use_match8 = self.pre_effects.is_empty()
+            && self.neg_fields.is_empty()
+            && self.post_effects.is_empty()
+            && self.successors.len() <= 1;
+
+        let opcode = if can_use_match8 {
+            Opcode::Match8
+        } else {
+            // Each list count is packed into 3 bits; a longer list would
+            // silently corrupt the neighbouring count fields.
+            const MAX_LIST_LEN: usize = 0x7;
+            if self.pre_effects.len() > MAX_LIST_LEN
+                || self.neg_fields.len() > MAX_LIST_LEN
+                || self.post_effects.len() > MAX_LIST_LEN
+            {
+                return None;
+            }
+            // Extended match: count all payload slots. The 28-slot cap also
+            // keeps the successor count within its 6-bit field.
+            let slots_needed = self.pre_effects.len()
+                + self.neg_fields.len()
+                + self.post_effects.len()
+                + self.successors.len();
+            select_match_opcode(slots_needed)?
+        };
+        let size = opcode.size();
+        let mut bytes = vec![0u8; size];
+
+        // Type ID byte
+        bytes[0] = (self.segment << 4) | (opcode as u8);
+        bytes[1] = self.nav.to_byte();
+
+        // Node type/field
+        let node_type_val = self.node_type.map(|n| n.get()).unwrap_or(0);
+        bytes[2..4].copy_from_slice(&node_type_val.to_le_bytes());
+        let node_field_val = self.node_field.map(|n| n.get()).unwrap_or(0);
+        bytes[4..6].copy_from_slice(&node_field_val.to_le_bytes());
+
+        if opcode == Opcode::Match8 {
+            // Match8: single successor or accept
+            let next = self.successors.first().copied().unwrap_or(StepId::ACCEPT);
+            bytes[6..8].copy_from_slice(&next.0.to_le_bytes());
+        } else {
+            // Extended match: pack counts and payload
+            let pre_count = self.pre_effects.len() as u16;
+            let neg_count = self.neg_fields.len() as u16;
+            let post_count = self.post_effects.len() as u16;
+            let succ_count = self.successors.len() as u16;
+
+            let counts =
+                (pre_count << 13) | (neg_count << 10) | (post_count << 7) | (succ_count << 1);
+            bytes[6..8].copy_from_slice(&counts.to_le_bytes());
+
+            // Payload order: pre_effects, neg_fields, post_effects, successors.
+            // Slots that are never written stay zero (padding).
+            let mut offset = 8;
+            let mut put = |word: &[u8]| {
+                bytes[offset..offset + 2].copy_from_slice(word);
+                offset += 2;
+            };
+            self.pre_effects.iter().for_each(|e| put(&e.to_bytes()));
+            self.neg_fields.iter().for_each(|f| put(&f.to_le_bytes()));
+            self.post_effects.iter().for_each(|e| put(&e.to_bytes()));
+            self.successors.iter().for_each(|s| put(&s.0.to_le_bytes()));
+        }
+
+        Some(bytes)
+    }
+}
+
+/// Zero-copy view into a Match instruction for efficient VM execution.
+///
+/// Unlike `Match`, this doesn't allocate - it stores a reference to the
+/// bytecode and provides iterator methods for accessing effects and successors.
+#[derive(Clone, Copy, Debug)]
+pub struct MatchView<'a> {
+    bytes: &'a [u8], // slice starting at the instruction; payload words are read lazily
+    /// Segment index (0-15, currently only 0 is used).
+    pub segment: u8,
+    /// Navigation command.
+    pub nav: Nav,
+    /// Node type constraint (None = wildcard).
+    pub node_type: Option<NonZeroU16>,
+    /// Field constraint (None = wildcard).
+    pub node_field: Option<NonZeroU16>,
+    /// Whether this is Match8 (no payload) or extended.
+    is_match8: bool,
+    /// For Match8: the single successor (0 = terminal). Always 0 for extended variants.
+    match8_next: u16,
+    /// For extended: number of pre-effects in the payload (0 for Match8).
+    pre_count: u8,
+    neg_count: u8, // number of negated fields (0 for Match8)
+    post_count: u8, // number of post-effects (0 for Match8)
+    succ_count: u8, // number of successors (0 or 1 for Match8)
+}
+
+impl<'a> MatchView<'a> {
+    /// Parse a Match instruction from bytecode without allocating.
+    ///
+    /// The slice must start at the instruction and contain at least
+    /// the full instruction size (determined by opcode).
+    ///
+    /// Malformed input (short slice, non-zero segment, non-Match opcode, counts
+    /// exceeding the opcode's payload) is only diagnosed by `debug_assert!`;
+    /// builds without debug assertions skip those checks.
+    #[inline]
+    pub fn from_bytes(bytes: &'a [u8]) -> Self {
+        debug_assert!(bytes.len() >= 8, "Match instruction too short");
+
+        let type_id_byte = bytes[0];
+        let segment = type_id_byte >> 4;
+        debug_assert!(segment == 0, "non-zero segment not yet supported");
+        let opcode = Opcode::from_u8(type_id_byte & 0xF);
+        debug_assert!(opcode.is_match(), "expected Match opcode");
+        debug_assert!(bytes.len() >= opcode.size(), "Match instruction truncated");
+
+        let nav = Nav::from_byte(bytes[1]);
+        let node_type = NonZeroU16::new(u16::from_le_bytes([bytes[2], bytes[3]]));
+        let node_field = NonZeroU16::new(u16::from_le_bytes([bytes[4], bytes[5]]));
+        let tail = u16::from_le_bytes([bytes[6], bytes[7]]);
+
+        // Bytes 6-7 are the successor for Match8 and the packed counts otherwise.
+        let is_match8 = opcode == Opcode::Match8;
+        let (pre_count, neg_count, post_count, succ_count) = if is_match8 {
+            (0, 0, 0, u8::from(tail != 0))
+        } else {
+            (
+                ((tail >> 13) & 0x7) as u8,
+                ((tail >> 10) & 0x7) as u8,
+                ((tail >> 7) & 0x7) as u8,
+                ((tail >> 1) & 0x3F) as u8,
+            )
+        };
+        let slots_used = usize::from(pre_count + neg_count + post_count + succ_count);
+        debug_assert!(
+            is_match8 || slots_used <= opcode.payload_slots(),
+            "Match payload overflow"
+        );
+
+        Self {
+            bytes,
+            segment,
+            nav,
+            node_type,
+            node_field,
+            is_match8,
+            match8_next: if is_match8 { tail } else { 0 },
+            pre_count,
+            neg_count,
+            post_count,
+            succ_count,
+        }
+    }
+
+    /// Check if this is a terminal (accept) state.
+    #[inline]
+    pub fn is_terminal(&self) -> bool {
+        self.succ_count == 0
+    }
+
+    /// Check if this is an epsilon transition (no node interaction).
+    #[inline]
+    pub fn is_epsilon(&self) -> bool {
+        self.nav == Nav::Stay && self.node_type.is_none() && self.node_field.is_none()
+    }
+
+    /// Number of successors.
+    #[inline]
+    pub fn succ_count(&self) -> usize {
+        self.succ_count as usize
+    }
+
+    /// Get a successor by index.
+    /// `idx` must be less than `succ_count()` (checked only via `debug_assert!`).
+    #[inline]
+    pub fn successor(&self, idx: usize) -> StepId {
+        debug_assert!(idx < self.succ_count(), "successor index out of bounds");
+        if self.is_match8 {
+            debug_assert!(idx == 0);
+            StepId(self.match8_next)
+        } else {
+            let offset = self.succ_offset() + idx * 2;
+            StepId(u16::from_le_bytes([self.bytes[offset], self.bytes[offset + 1]]))
+        }
+    }
+
+    /// Iterate over pre-effects (executed before match attempt).
+    #[inline]
+    pub fn pre_effects(&self) -> impl Iterator<Item = EffectOp> + '_ {
+        self.slots(8, self.pre_count).map(EffectOp::from_bytes)
+    }
+
+    /// Iterate over negated fields (must NOT be present on matched node).
+    #[inline]
+    pub fn neg_fields(&self) -> impl Iterator<Item = u16> + '_ {
+        let start = 8 + usize::from(self.pre_count) * 2;
+        self.slots(start, self.neg_count).map(u16::from_le_bytes)
+    }
+
+    /// Iterate over post-effects (executed after successful match).
+    #[inline]
+    pub fn post_effects(&self) -> impl Iterator<Item = EffectOp> + '_ {
+        let start = 8 + (usize::from(self.pre_count) + usize::from(self.neg_count)) * 2;
+        self.slots(start, self.post_count).map(EffectOp::from_bytes)
+    }
+
+    /// Iterate over successors.
+    #[inline]
+    pub fn successors(&self) -> impl Iterator<Item = StepId> + '_ {
+        (0..self.succ_count as usize).map(move |i| self.successor(i))
+    }
+
+    /// Byte offset where successors start in the payload.
+    #[inline]
+    fn succ_offset(&self) -> usize {
+        8 + (self.pre_count as usize + self.neg_count as usize + self.post_count as usize) * 2
+    }
+
+    /// Lazily yield `count` raw 2-byte payload slots starting at byte offset `start`.
+    #[inline]
+    fn slots(&self, start: usize, count: u8) -> impl Iterator<Item = [u8; 2]> + '_ {
+        (0..usize::from(count)).map(move |i| {
+            let offset = start + i * 2;
+            [self.bytes[offset], self.bytes[offset + 1]]
+        })
+    }
+}
+
+/// Call instruction for invoking definitions (recursion); encoded in 8 bytes.
+#[derive(Clone, Copy, PartialEq, Eq, Debug)]
+pub struct Call {
+    /// Segment index (0-15); high nibble of byte 0. Decoding requires 0 for now.
+    pub segment: u8,
+    /// Return address (current segment); bytes 2-3, little-endian.
+    pub next: StepId,
+    /// Callee entry point (target segment from type_id); bytes 4-5, little-endian.
+    pub target: StepId,
+    /// Definition identifier for stack validation; bytes 6-7, little-endian.
+    pub ref_id: u16,
+}
+
+impl Call {
+    /// Decode from 8-byte bytecode.
+    ///
+    /// Panics if the segment nibble is non-zero or the opcode is not `Call`.
+    pub fn from_bytes(bytes: [u8; 8]) -> Self {
+        let [type_id, _reserved, n0, n1, t0, t1, r0, r1] = bytes;
+        let segment = type_id >> 4;
+        assert!(
+            segment == 0,
+            "non-zero segment not yet supported: {segment}"
+        );
+        assert_eq!(Opcode::from_u8(type_id & 0xF), Opcode::Call, "expected Call opcode");
+
+        Self {
+            segment,
+            next: StepId(u16::from_le_bytes([n0, n1])),
+            target: StepId(u16::from_le_bytes([t0, t1])),
+            ref_id: u16::from_le_bytes([r0, r1]),
+        }
+    }
+
+    /// Encode to 8-byte bytecode.
+    /// Byte 1 is reserved and always written as zero.
+    pub fn to_bytes(&self) -> [u8; 8] {
+        let type_id = (self.segment << 4) | (Opcode::Call as u8);
+        let [n0, n1] = self.next.0.to_le_bytes();
+        let [t0, t1] = self.target.0.to_le_bytes();
+        let [r0, r1] = self.ref_id.to_le_bytes();
+        [type_id, 0, n0, n1, t0, t1, r0, r1]
+    }
+}
+
+/// Return instruction for returning from definitions; encoded in 8 bytes.
+#[derive(Clone, Copy, PartialEq, Eq, Debug)]
+pub struct Return {
+    /// Segment index (0-15); high nibble of byte 0. Decoding requires 0 for now.
+    pub segment: u8,
+    /// Definition identifier for stack validation; bytes 2-3, little-endian.
+    pub ref_id: u16,
+}
+
+impl Return {
+    /// Decode from 8-byte bytecode.
+    ///
+    /// Panics if the segment nibble is non-zero or the opcode is not `Return`.
+    pub fn from_bytes(bytes: [u8; 8]) -> Self {
+        // Byte 1 is reserved and bytes 4-7 are padding; neither is inspected.
+        let [type_id, _reserved, r0, r1, ..] = bytes;
+        let segment = type_id >> 4;
+        assert!(
+            segment == 0,
+            "non-zero segment not yet supported: {segment}"
+        );
+        assert_eq!(Opcode::from_u8(type_id & 0xF), Opcode::Return, "expected Return opcode");
+
+        Self {
+            segment,
+            ref_id: u16::from_le_bytes([r0, r1]),
+        }
+    }
+
+    /// Encode to 8-byte bytecode.
+    /// Byte 1 (reserved) and bytes 4-7 (padding) are written as zero.
+    pub fn to_bytes(&self) -> [u8; 8] {
+        let type_id = (self.segment << 4) | (Opcode::Return as u8);
+        let [r0, r1] = self.ref_id.to_le_bytes();
+        [type_id, 0, r0, r1, 0, 0, 0, 0]
+    }
+}
+
+/// Pick the smallest Match opcode whose payload holds `slots_needed` u16 slots.
+/// Returns `None` above 28 slots, where the instruction is too large and must be split.
+pub fn select_match_opcode(slots_needed: usize) -> Option<Opcode> {
+    let opcode = match slots_needed {
+        0 => Opcode::Match8,
+        1..=4 => Opcode::Match16,
+        5..=8 => Opcode::Match24,
+        9..=12 => Opcode::Match32,
+        13..=20 => Opcode::Match48,
+        21..=28 => Opcode::Match64,
+        _ => return None,
+    };
+    Some(opcode)
+}
+
+/// Round `size` up to the next multiple of SECTION_ALIGN (64 bytes).
+#[inline]
+pub fn align_to_section(size: usize) -> usize {
+    (size + SECTION_ALIGN - 1) / SECTION_ALIGN * SECTION_ALIGN
+}
diff --git a/crates/plotnik-lib/src/bytecode/instructions_tests.rs b/crates/plotnik-lib/src/bytecode/instructions_tests.rs
new file mode 100644
index 00000000..c3e21604
--- /dev/null
+++ b/crates/plotnik-lib/src/bytecode/instructions_tests.rs
@@ -0,0 +1,267 @@
+//! Tests for bytecode instructions.
+
+use std::num::NonZeroU16;
+
+use super::effects::{EffectOp, EffectOpcode};
+use super::ids::StepId;
+use super::instructions::{
+    Call, Match, MatchView, Opcode, Return, align_to_section, select_match_opcode,
+};
+use super::nav::Nav;
+
+#[test]
+fn opcode_sizes() {
+    // Every Match variant is named after its encoded size in bytes.
+    assert_eq!(8, Opcode::Match8.size());
+    assert_eq!(16, Opcode::Match16.size());
+    assert_eq!(24, Opcode::Match24.size());
+    assert_eq!(32, Opcode::Match32.size());
+    assert_eq!(48, Opcode::Match48.size());
+    assert_eq!(64, Opcode::Match64.size());
+    assert_eq!((8, 8), (Opcode::Call.size(), Opcode::Return.size()));
+}
+
+#[test]
+fn opcode_step_counts() {
+    type Op = Opcode;
+    let steps = |ops: [Op; 4]| ops.map(Op::step_count);
+    assert_eq!(steps([Op::Match8, Op::Match16, Op::Match24, Op::Match32]), [1, 2, 3, 4]);
+    assert_eq!(steps([Op::Match48, Op::Match64, Op::Call, Op::Return]), [6, 8, 1, 1]);
+}
+
+#[test]
+fn opcode_payload_slots() {
+    type Op = Opcode;
+
+    // Match8 has no payload; each extended variant holds (size - 8) / 2 slots.
+    let slots = |ops: [Op; 3]| ops.map(Op::payload_slots);
+    assert_eq!(slots([Op::Match8, Op::Match16, Op::Match24]), [0, 4, 8]);
+    assert_eq!(slots([Op::Match32, Op::Match48, Op::Match64]), [12, 20, 28]);
+}
+
+#[test]
+fn select_match_opcode_picks_smallest() {
+    // Tier boundaries, plus the first slot count that no longer fits anywhere.
+    let pick = select_match_opcode;
+    assert_eq!(pick(0), Some(Opcode::Match8));
+    assert_eq!([pick(1), pick(4)], [Some(Opcode::Match16); 2]);
+    assert_eq!(pick(5), Some(Opcode::Match24));
+    assert_eq!(pick(12), Some(Opcode::Match32));
+    assert_eq!(pick(20), Some(Opcode::Match48));
+    assert_eq!([pick(28), pick(29)], [Some(Opcode::Match64), None]);
+}
+
+#[test]
+fn align_to_section_works() {
+    // Multiples of 64 (including 0) are already aligned.
+    assert_eq!([0, 64].map(align_to_section), [0, 64]);
+
+    // Everything else rounds up to the next multiple of 64.
+    assert_eq!([1, 65, 100].map(align_to_section), [64, 128, 128]);
+}
+
+#[test]
+fn match8_roundtrip() {
+    let original = Match {
+        segment: 0,
+        nav: Nav::Down,
+        node_type: NonZeroU16::new(42),
+        node_field: NonZeroU16::new(7),
+        pre_effects: Vec::new(),
+        neg_fields: Vec::new(),
+        post_effects: Vec::new(),
+        successors: vec![StepId(10)],
+    };
+
+    // No effects or negated fields and a single successor: the 8-byte form suffices.
+    let encoded = original.to_bytes().unwrap();
+    assert_eq!(encoded.len(), 8);
+
+    assert_eq!(Match::from_bytes(&encoded), original);
+}
+
+#[test]
+fn match8_terminal_roundtrip() {
+    let original = Match {
+        segment: 0,
+        nav: Nav::Stay,
+        node_type: None,
+        node_field: None,
+        pre_effects: Vec::new(),
+        neg_fields: Vec::new(),
+        post_effects: Vec::new(),
+        successors: Vec::new(),
+    };
+
+    // An accepting epsilon step still encodes as a plain 8-byte Match8.
+    let encoded = original.to_bytes().unwrap();
+    assert_eq!(encoded.len(), 8);
+
+    let roundtripped = Match::from_bytes(&encoded);
+    assert!(roundtripped.is_terminal() && roundtripped.is_epsilon());
+    assert_eq!(roundtripped, original);
+}
+
+#[test]
+fn match_extended_roundtrip() {
+    let pre_effects = vec![EffectOp {
+        opcode: EffectOpcode::S,
+        payload: 0,
+    }];
+    let post_effects = vec![
+        EffectOp {
+            opcode: EffectOpcode::Node,
+            payload: 0,
+        },
+        EffectOp {
+            opcode: EffectOpcode::Set,
+            payload: 42,
+        },
+    ];
+    let original = Match {
+        segment: 0,
+        nav: Nav::Next,
+        node_type: NonZeroU16::new(100),
+        node_field: None,
+        pre_effects,
+        neg_fields: vec![5, 6],
+        post_effects,
+        successors: vec![StepId(20), StepId(30)],
+    };
+
+    // 1 pre + 2 neg + 2 post + 2 succ = 7 slots → Match24 (8 slots capacity)
+    let encoded = original.to_bytes().unwrap();
+    assert_eq!(encoded.len(), 24);
+    assert_eq!(Match::from_bytes(&encoded), original);
+}
+
+#[test]
+fn call_roundtrip() {
+    let original = Call {
+        segment: 0,
+        next: StepId(100),
+        target: StepId(500),
+        ref_id: 42,
+    };
+
+    // Encoding then decoding must reproduce every field.
+    let encoded: [u8; 8] = original.to_bytes();
+    assert_eq!(Call::from_bytes(encoded), original);
+}
+
+#[test]
+fn return_roundtrip() {
+    let original = Return {
+        segment: 0,
+        ref_id: 99,
+    };
+
+    // Encoding then decoding must reproduce every field.
+    let encoded: [u8; 8] = original.to_bytes();
+    assert_eq!(Return::from_bytes(encoded), original);
+}
+
+#[test]
+fn match_view_match8() {
+    let encoded = Match {
+        segment: 0,
+        nav: Nav::Down,
+        node_type: NonZeroU16::new(42),
+        node_field: NonZeroU16::new(7),
+        pre_effects: Vec::new(),
+        neg_fields: Vec::new(),
+        post_effects: Vec::new(),
+        successors: vec![StepId(10)],
+    }
+    .to_bytes()
+    .unwrap();
+    let view = MatchView::from_bytes(&encoded);
+    // Header fields are decoded eagerly.
+    assert_eq!(view.nav, Nav::Down);
+    assert_eq!((view.node_type, view.node_field), (NonZeroU16::new(42), NonZeroU16::new(7)));
+    assert!(!view.is_terminal() && !view.is_epsilon());
+
+    // Match8 carries exactly one successor and no payload lists.
+    assert_eq!(view.succ_count(), 1);
+    assert_eq!(view.successor(0), StepId(10));
+    assert_eq!(view.pre_effects().count(), 0);
+    assert_eq!(view.neg_fields().count(), 0);
+    assert_eq!(view.post_effects().count(), 0);
+}
+
+#[test]
+fn match_view_terminal() {
+    let encoded = Match {
+        segment: 0,
+        nav: Nav::Stay,
+        node_type: None,
+        node_field: None,
+        pre_effects: Vec::new(),
+        neg_fields: Vec::new(),
+        post_effects: Vec::new(),
+        successors: Vec::new(),
+    }
+    .to_bytes()
+    .unwrap();
+    let view = MatchView::from_bytes(&encoded);
+
+    // No successors means accept; Stay without constraints means epsilon.
+    assert_eq!(view.succ_count(), 0);
+    assert!(view.is_terminal() && view.is_epsilon());
+}
+
+#[test]
+fn match_view_extended() {
+    let pre_effects = vec![EffectOp {
+        opcode: EffectOpcode::S,
+        payload: 0,
+    }];
+    let post_effects = vec![
+        EffectOp {
+            opcode: EffectOpcode::Node,
+            payload: 0,
+        },
+        EffectOp {
+            opcode: EffectOpcode::Set,
+            payload: 42,
+        },
+    ];
+    let encoded = Match {
+        segment: 0,
+        nav: Nav::Next,
+        node_type: NonZeroU16::new(100),
+        node_field: None,
+        pre_effects,
+        neg_fields: vec![5, 6],
+        post_effects,
+        successors: vec![StepId(20), StepId(30)],
+    }
+    .to_bytes()
+    .unwrap();
+    let view = MatchView::from_bytes(&encoded);
+
+    // Header fields
+    assert_eq!(view.nav, Nav::Next);
+    assert_eq!(view.node_type, NonZeroU16::new(100));
+    assert!(!view.is_terminal());
+
+    // Pre-effects: a single `S`
+    let pre_opcodes: Vec<_> = view.pre_effects().map(|effect| effect.opcode).collect();
+    assert_eq!(pre_opcodes, vec![EffectOpcode::S]);
+
+    // Negated fields
+    let neg: Vec<_> = view.neg_fields().collect();
+    assert_eq!(neg, vec![5, 6]);
+
+    // Post-effects: `Node`, then `Set` with payload 42
+    let post: Vec<_> = view.post_effects().collect();
+    assert_eq!(post.len(), 2);
+    assert_eq!(post[0].opcode, EffectOpcode::Node);
+    assert_eq!(post[1].opcode, EffectOpcode::Set);
+    assert_eq!(post[1].payload, 42);
+
+    // Successors, by index and through the iterator
+    assert_eq!(view.succ_count(), 2);
+    assert_eq!([view.successor(0), view.successor(1)], [StepId(20), StepId(30)]);
+    assert_eq!(view.successors().collect::<Vec<_>>(), vec![StepId(20), StepId(30)]);
+}
diff --git a/crates/plotnik-lib/src/bytecode/mod.rs b/crates/plotnik-lib/src/bytecode/mod.rs
index 9ddadd7b..1b39e286 100644
--- a/crates/plotnik-lib/src/bytecode/mod.rs
+++ b/crates/plotnik-lib/src/bytecode/mod.rs
@@ -7,6 +7,7 @@ mod effects;
 mod entrypoint;
 mod header;
 mod ids;
+mod instructions;
 mod nav;
 mod sections;
 mod type_meta;
@@ -29,3 +30,10 @@ pub use effects::{EffectOp, EffectOpcode};
 pub use entrypoint::Entrypoint;
 
 pub use type_meta::{TypeDef, TypeKind, TypeMember, TypeMetaHeader, TypeName};
+
+pub use instructions::{
+    Call, Match, MatchView, Opcode, Return, align_to_section, select_match_opcode,
+};
+
+#[cfg(test)]
+mod instructions_tests;