plotnik-lang · zharinov · Jan 15, 2026 · Jan 15, 2026
diff --git a/crates/plotnik-compiler/src/bytecode/ir.rs b/crates/plotnik-compiler/src/bytecode/ir.rs
@@ -606,11 +606,20 @@ impl MatchIR {
             // counts layout: pre(3) | neg(3) | post(3) | succ(5) | has_pred(1) | reserved(1)
             assert!(
                 pre_count <= 7,
-                "pre_effects overflow: {pre_count} > 7 (use emit_match_with_cascade)"
+                "pre_effects overflow: {pre_count} > 7 (lowering should have cascaded)"
+            );
+            assert!(
+                neg_count <= 7,
+                "neg_fields overflow: {neg_count} > 7 (lowering should have cascaded)"
+            );
+            assert!(
+                post_count <= 7,
+                "post_effects overflow: {post_count} > 7 (lowering should have cascaded)"
+            );
+            assert!(
+                succ_count <= 31,
+                "successors overflow: {succ_count} > 31 (lowering should have cascaded)"
             );
-            assert!(neg_count <= 7, "neg_fields overflow: {neg_count} > 7");
-            assert!(post_count <= 7, "post_effects overflow: {post_count} > 7");
-            assert!(succ_count <= 31, "successors overflow: {succ_count} > 31");
 
             let counts = ((pre_count as u16) << 13)
                 | ((neg_count as u16) << 10)

diff --git a/crates/plotnik-compiler/src/compile/compiler.rs b/crates/plotnik-compiler/src/compile/compiler.rs
@@ -15,6 +15,7 @@ use plotnik_bytecode::Nav;
 use super::capture::CaptureEffects;
 use super::dce::remove_unreachable;
 use super::epsilon_elim::eliminate_epsilons;
+use super::lower::lower;
 use super::error::{CompileError, CompileResult};
 use super::scope::StructScope;
 use super::verify::debug_verify_ir_fingerprint;
@@ -86,6 +87,9 @@ impl<'a> Compiler<'a> {
         // Remove unreachable instructions (bypassed epsilons, etc.)
         remove_unreachable(&mut result);
 
+        // Lower to bytecode-compatible form (cascade overflows)
+        lower(&mut result);
+
         Ok(result)
     }
 

diff --git a/crates/plotnik-compiler/src/compile/expressions.rs b/crates/plotnik-compiler/src/compile/expressions.rs
@@ -49,7 +49,7 @@ impl Compiler<'_> {
             if let Some(p) = predicate {
                 m = m.predicate(p);
             }
-            return self.emit_match_with_cascade(m);
+            return self.emit_match(m);
         }
 
         // Determine Up navigation based on trailing anchor
@@ -123,7 +123,7 @@ impl Compiler<'_> {
         if let Some(p) = predicate {
             entry_match = entry_match.predicate(p);
         }
-        self.emit_match_with_cascade(entry_match);
+        self.emit_match(entry_match);
 
         entry
     }
@@ -201,7 +201,7 @@ impl Compiler<'_> {
         if let Some(p) = predicate {
             entry_match = entry_match.predicate(p);
         }
-        self.emit_match_with_cascade(entry_match);
+        self.emit_match(entry_match);
 
         entry
     }
@@ -236,7 +236,7 @@ impl Compiler<'_> {
             None => NodeTypeIR::Any, // `_` wildcard matches any node
         };
 
-        self.emit_match_with_cascade(
+        self.emit_match(
             MatchIR::epsilon(entry, exit)
                 .nav(nav)
                 .node_type(node_type)

diff --git a/crates/plotnik-compiler/src/compile/lower.rs b/crates/plotnik-compiler/src/compile/lower.rs
@@ -0,0 +1,206 @@
+//! Lowering pass: transforms unconstrained IR into bytecode-compatible form.
+//!
+//! This pass handles bytecode encoding constraints by splitting oversized
+//! instructions into cascading epsilon chains:
+//! - pre_effects > 7 → epsilon chain before match
+//! - post_effects > 7 → epsilon chain after match
+//! - neg_fields > 7 → epsilon chain for overflow checks
+//! - successors > 28 → cascading epsilon branches
+
+use plotnik_bytecode::{MAX_MATCH_PAYLOAD_SLOTS, MAX_PRE_EFFECTS};
+
+use crate::bytecode::{EffectIR, InstructionIR, Label, MatchIR};
+use crate::compile::CompileResult;
+
+const MAX_POST_EFFECTS: usize = 7;
+const MAX_NEG_FIELDS: usize = 7;
+
+enum PostChain {
+    NegFields(Vec<u16>),
+    PostEffects(Vec<EffectIR>),
+    Successors(Vec<Label>),
+}
+
+/// Lower IR to bytecode-compatible form.
+///
+/// Transforms instructions that exceed bytecode encoding limits into
+/// equivalent cascades of smaller instructions.
+pub fn lower(result: &mut CompileResult) {
+    let mut next_label = result
+        .instructions
+        .iter()
+        .map(|i| i.label().0)
+        .max()
+        .unwrap_or(0)
+        + 1;
+
+    let mut new_instructions = Vec::with_capacity(result.instructions.len());
+
+    for instr in result.instructions.drain(..) {
+        let InstructionIR::Match(m) = instr else {
+            new_instructions.push(instr);
+            continue;
+        };
+        lower_match(m, &mut new_instructions, &mut next_label);
+    }
+
+    result.instructions = new_instructions;
+}
+
+fn fresh_label(next: &mut u32) -> Label {
+    let l = Label(*next);
+    *next += 1;
+    l
+}
+
+fn lower_match(mut m: MatchIR, out: &mut Vec<InstructionIR>, next_label: &mut u32) {
+    // Step 1: Handle pre_effects overflow → epsilon chain before the match
+    if m.pre_effects.len() > MAX_PRE_EFFECTS {
+        let all_pre = std::mem::take(&mut m.pre_effects);
+        let entry = m.label;
+        m.label = fresh_label(next_label);
+        emit_effects_chain(entry, m.label, all_pre, out, next_label);
+    }
+
+    // Collect overflow chains to emit after the match
+    let mut post_chains: Vec<PostChain> = Vec::new();
+
+    if m.neg_fields.len() > MAX_NEG_FIELDS {
+        let overflow: Vec<_> = m.neg_fields.drain(MAX_NEG_FIELDS..).collect();
+        post_chains.push(PostChain::NegFields(overflow));
+    }
+
+    if m.post_effects.len() > MAX_POST_EFFECTS {
+        let overflow: Vec<_> = m.post_effects.drain(MAX_POST_EFFECTS..).collect();
+        post_chains.push(PostChain::PostEffects(overflow));
+    }
+
+    if m.successors.len() > MAX_MATCH_PAYLOAD_SLOTS {
+        let overflow: Vec<_> = m.successors.drain(MAX_MATCH_PAYLOAD_SLOTS - 1..).collect();
+        post_chains.push(PostChain::Successors(overflow));
+    }
+
+    if post_chains.is_empty() {
+        out.push(m.into());
+        return;
+    }
+
+    // Build chain: match → chain1 → chain2 → ... → final_succs
+    let mut current_succs = std::mem::take(&mut m.successors);
+
+    for chain in post_chains.into_iter().rev() {
+        let chain_entry = fresh_label(next_label);
+        match chain {
+            PostChain::NegFields(neg_fields) => {
+                emit_neg_fields_chain(chain_entry, current_succs, neg_fields, out, next_label);
+            }
+            PostChain::PostEffects(effects) => {
+                emit_effects_chain_to_succs(chain_entry, current_succs, effects, out, next_label);
+            }
+            PostChain::Successors(succs) => {
+                emit_successors_cascade(chain_entry, succs, out, next_label);
+                current_succs = vec![chain_entry];
+                continue;
+            }
+        }
+        current_succs = vec![chain_entry];
+    }
+
+    m.successors = current_succs;
+    out.push(m.into());
+}
+
+fn emit_effects_chain(
+    entry: Label,
+    exit: Label,
+    mut effects: Vec<EffectIR>,
+    out: &mut Vec<InstructionIR>,
+    next_label: &mut u32,
+) {
+    if effects.is_empty() {
+        out.push(MatchIR::epsilon(entry, exit).into());
+        return;
+    }
+
+    if effects.len() <= MAX_PRE_EFFECTS {
+        out.push(MatchIR::epsilon(entry, exit).pre_effects(effects).into());
+        return;
+    }
+
+    let first_batch: Vec<_> = effects.drain(..MAX_PRE_EFFECTS).collect();
+    let intermediate = fresh_label(next_label);
+    out.push(
+        MatchIR::epsilon(entry, intermediate)
+            .pre_effects(first_batch)
+            .into(),
+    );
+    emit_effects_chain(intermediate, exit, effects, out, next_label);
+}
+
+fn emit_neg_fields_chain(
+    entry: Label,
+    final_succs: Vec<Label>,
+    mut neg_fields: Vec<u16>,
+    out: &mut Vec<InstructionIR>,
+    next_label: &mut u32,
+) {
+    if neg_fields.len() <= MAX_NEG_FIELDS {
+        let mut m = MatchIR::at(entry).neg_fields(neg_fields);
+        m.successors = final_succs;
+        out.push(m.into());
+        return;
+    }
+
+    let first_batch: Vec<_> = neg_fields.drain(..MAX_NEG_FIELDS).collect();
+    let intermediate = fresh_label(next_label);
+    out.push(
+        MatchIR::at(entry)
+            .neg_fields(first_batch)
+            .next(intermediate)
+            .into(),
+    );
+    emit_neg_fields_chain(intermediate, final_succs, neg_fields, out, next_label);
+}
+
+fn emit_effects_chain_to_succs(
+    entry: Label,
+    final_succs: Vec<Label>,
+    mut effects: Vec<EffectIR>,
+    out: &mut Vec<InstructionIR>,
+    next_label: &mut u32,
+) {
+    if effects.len() <= MAX_POST_EFFECTS {
+        let mut m = MatchIR::at(entry).post_effects(effects);
+        m.successors = final_succs;
+        out.push(m.into());
+        return;
+    }
+
+    let first_batch: Vec<_> = effects.drain(..MAX_POST_EFFECTS).collect();
+    let intermediate = fresh_label(next_label);
+    out.push(
+        MatchIR::at(entry)
+            .post_effects(first_batch)
+            .next(intermediate)
+            .into(),
+    );
+    emit_effects_chain_to_succs(intermediate, final_succs, effects, out, next_label);
+}
+
+fn emit_successors_cascade(
+    entry: Label,
+    mut succs: Vec<Label>,
+    out: &mut Vec<InstructionIR>,
+    next_label: &mut u32,
+) {
+    if succs.len() <= MAX_MATCH_PAYLOAD_SLOTS {
+        out.push(MatchIR::at(entry).next_many(succs).into());
+        return;
+    }
+
+    let overflow: Vec<_> = succs.drain(MAX_MATCH_PAYLOAD_SLOTS - 1..).collect();
+    let intermediate = fresh_label(next_label);
+    succs.push(intermediate);
+    out.push(MatchIR::at(entry).next_many(succs).into());
+    emit_successors_cascade(intermediate, overflow, out, next_label);
+}