lex_bytecode/verify.rs
1//! Bytecode stack-depth verifier — the third `--strict` check from #347 A2.
2//!
3//! Walks every function's instruction stream, tracking the abstract stack
4//! depth through each opcode and branch. Reports a `StackError` when two
5//! paths into the same program counter carry different depths, which would
6//! mean a prior match arm leaked (or over-consumed) values and left the
7//! stack in an inconsistent state for subsequent arms.
8//!
9//! The check is lightweight: it is a single linear pass with a small
10//! worklist. No allocation beyond `Vec` is needed.
11//!
12//! # Known sound over-approximation
13//!
14//! `Return` and `Panic` terminate the function; their successors are not
15//! added to the worklist. `TailCall` is treated like `Return`. This means
16//! dead code after a `Return` / `Panic` is not checked — intentional.
17
18use crate::op::Op;
19use crate::program::Function;
20
21#[derive(Debug, Clone, PartialEq)]
22pub struct StackError {
23 pub fn_name: String,
24 pub pc: usize,
25 pub depth_a: i32,
26 pub depth_b: i32,
27}
28
29impl std::fmt::Display for StackError {
30 fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
31 write!(
32 f,
33 "stack depth mismatch in `{}` at pc {}: path A leaves depth {}, path B leaves depth {}",
34 self.fn_name, self.pc, self.depth_a, self.depth_b
35 )
36 }
37}
38
39/// Verify all functions in a slice. Returns one error per inconsistent
40/// merge point found.
41pub fn verify_program(functions: &[Function]) -> Vec<StackError> {
42 let mut errors = Vec::new();
43 for func in functions {
44 verify_function(func, &mut errors);
45 }
46 errors
47}
48
49/// Verify a single function. Appends to `errors`.
50pub fn verify_function(func: &Function, errors: &mut Vec<StackError>) {
51 let n = func.code.len();
52 if n == 0 {
53 return;
54 }
55
56 // `depths[pc]` = known stack depth at that pc, or `None` if not yet visited.
57 let mut depths: Vec<Option<i32>> = vec![None; n];
58
59 // Worklist: (pc, stack_depth_on_entry_to_this_instruction)
60 let mut worklist: Vec<(usize, i32)> = vec![(0, 0)];
61
62 while let Some((pc, depth)) = worklist.pop() {
63 if pc >= n {
64 continue;
65 }
66
67 // Merge-point check.
68 if let Some(prev) = depths[pc] {
69 if prev != depth {
70 errors.push(StackError {
71 fn_name: func.name.clone(),
72 pc,
73 depth_a: prev,
74 depth_b: depth,
75 });
76 }
77 // Already processed from this depth (or recorded mismatch).
78 continue;
79 }
80 depths[pc] = Some(depth);
81
82 let op = &func.code[pc];
83 let delta = stack_delta(op);
84 let next_depth = depth + delta;
85
86 match op {
87 // Unconditional jumps: only the target is a successor.
88 Op::Jump(off) => {
89 let target = (pc as i32 + 1 + off) as usize;
90 worklist.push((target, next_depth));
91 }
92 // Conditional jumps: fall-through and jump target are both successors.
93 // Note: JumpIf / JumpIfNot pop the Bool before branching, so `delta`
94 // already accounts for that (-1). Both successors start at next_depth.
95 Op::JumpIf(off) | Op::JumpIfNot(off) => {
96 let target = (pc as i32 + 1 + off) as usize;
97 worklist.push((pc + 1, next_depth));
98 worklist.push((target, next_depth));
99 }
100 // Terminators: no successors.
101 Op::Return | Op::TailCall { .. } | Op::Panic(_) => {}
102 // Slice-2 superinstruction (#461) owns 4 slots: the fused
103 // op + 3 tombstones (original PushConst + IntAdd +
104 // StoreLocal). The trailing tombstones' deltas don't
105 // cancel (+1, -1, -1 = -1), so we can't let the verifier
106 // walk them as live — it'd drift the depth at pc+4 vs the
107 // pre-fusion form. Skip directly to pc+4 with the
108 // unfused-equivalent depth.
109 Op::LoadLocalAddIntConstStoreLocal { .. } => {
110 worklist.push((pc + 4, next_depth));
111 }
112 // Slice-5 superinstructions (#461) — jump-aware fusion of
113 // `LoadLocal + LoadLocal|PushConst + IntLt + JumpIfNot`.
114 // 4-slot window like slice 2 but with TWO successors
115 // (fall-through and branch target). Tombstones' deltas
116 // (+1 LoadLocal/PushConst, -1 IntLt, -1 JumpIfNot = -1
117 // total) don't cancel — skip past in the same shape as
118 // slice 2's worklist override. The branch target's
119 // offset is relative to the JumpIfNot's `pc + 1`, which
120 // in the fused position is `pc + 4`.
121 Op::LoadLocalEqIntConstJumpIfNot { jump_offset, .. } => {
122 let target = (pc as i32 + 4 + jump_offset) as usize;
123 worklist.push((pc + 4, next_depth));
124 worklist.push((target, next_depth));
125 }
126 // Slice 6 owns a 6-slot window (this op + 5 tombstones).
127 // Same two-successor shape as slice 5 but with `pc + 6`
128 // arithmetic. Net stack delta is 0 — original was
129 // LoadLocal + StoreLocal + slice5 = +1 + -1 + 0.
130 Op::LoadLocalStoreEqIntConstJumpIfNot { jump_offset, .. } => {
131 let target = (pc as i32 + 6 + jump_offset) as usize;
132 worklist.push((pc + 6, next_depth));
133 worklist.push((target, next_depth));
134 }
135 // All other ops: single sequential successor.
136 _ => {
137 worklist.push((pc + 1, next_depth));
138 }
139 }
140 }
141}
142
143/// Returns the net change in stack depth caused by `op`.
144///
145/// Positive = pushes more than it pops.
146/// Negative = pops more than it pushes.
147fn stack_delta(op: &Op) -> i32 {
148 match op {
149 // Stack manipulation
150 Op::PushConst(_) => 1,
151 Op::Pop => -1,
152 Op::Dup => 1,
153
154 // Locals
155 Op::LoadLocal(_) => 1,
156 Op::StoreLocal(_) => -1,
157
158 // Record / tuple / list construction
159 Op::MakeRecord { field_count, .. } => -(*field_count as i32) + 1,
160 // #464 step 2: same stack-effect shape as MakeRecord (pops
161 // field_count, pushes 1). The verifier doesn't need to know
162 // about the stack-record arena — it walks bytecode shape only.
163 Op::AllocStackRecord { field_count, .. } => -(*field_count as i32) + 1,
164 Op::MakeTuple(n) => -(*n as i32) + 1,
165 // #464 tuple codegen: same stack-effect shape as MakeTuple.
166 Op::AllocStackTuple { arity } => -(*arity as i32) + 1,
167 Op::MakeList(n) => -(*n as i32) + 1,
168 Op::MakeVariant { arity, .. } => -(*arity as i32) + 1,
169
170 // Field/element access: pop 1, push 1
171 Op::GetField { .. } => 0,
172 Op::GetElem(_) => 0,
173 Op::GetListElem(_) => 0,
174 Op::GetListLen => 0,
175
176 // Variant ops: pop 1, push 1
177 Op::TestVariant(_) => 0,
178 Op::GetVariant(_) => 0,
179 Op::GetVariantArg(_)=> 0,
180
181 // Binary list ops: pop 2, push 1
182 Op::ListAppend => -1,
183 Op::GetListElemDyn => -1,
184
185 // Jumps: delta handled in the control-flow logic above; use 0 here
186 // so that next_depth = depth + 0 is the "effective post-instruction depth"
187 // before branching. The successor depths are added by the control-flow arms.
188 Op::Jump(_) | Op::JumpIf(_) | Op::JumpIfNot(_) => {
189 // JumpIf/JumpIfNot pop the Bool.
190 match op {
191 Op::JumpIf(_) | Op::JumpIfNot(_) => -1,
192 _ => 0,
193 }
194 }
195
196 // Calls: pop arity args, push 1 result
197 Op::Call { arity, .. } => -(*arity as i32) + 1,
198 Op::TailCall { arity, .. } => -(*arity as i32) + 1,
199 Op::CallClosure { arity, .. }=> -(*arity as i32 + 1) + 1, // also pops closure
200 Op::EffectCall { arity, .. } => -(*arity as i32) + 1,
201
202 // Closure construction: pop captures, push closure
203 Op::MakeClosure { capture_count, .. } => -(*capture_count as i32) + 1,
204
205 // Higher-order ops: pop list + fn, push result list
206 Op::SortByKey { .. } => -1,
207 Op::ParallelMap { .. }=> -1,
208 // #464 native list builders. map/filter pop [xs, f] push 1;
209 // fold pops [xs, init, f] push 1.
210 Op::ListMap { .. } => -1,
211 Op::ListFilter { .. } => -1,
212 Op::ListFold { .. } => -2,
213
214 // Terminators
215 Op::Return => -1, // pop return value
216 Op::Panic(_)=> 0, // does not matter (no successor)
217
218 // Arithmetic / comparison — all binary except Neg/Not
219 Op::IntAdd | Op::IntSub | Op::IntMul | Op::IntDiv | Op::IntMod => -1,
220 Op::IntEq | Op::IntLt | Op::IntLe => -1,
221 Op::IntNeg => 0,
222
223 Op::FloatAdd | Op::FloatSub | Op::FloatMul | Op::FloatDiv => -1,
224 Op::FloatEq | Op::FloatLt | Op::FloatLe => -1,
225 Op::FloatNeg => 0,
226
227 Op::NumAdd | Op::NumSub | Op::NumMul | Op::NumDiv | Op::NumMod => -1,
228 Op::NumEq | Op::NumLt | Op::NumLe => -1,
229 Op::NumNeg => 0,
230
231 Op::BoolAnd | Op::BoolOr => -1,
232 Op::BoolNot => 0,
233
234 Op::StrConcat => -1,
235 Op::StrLen => 0,
236 Op::StrEq => -1,
237 Op::BytesLen => 0,
238 Op::BytesEq => -1,
239
240 // Superinstructions (#461). The fused op contributes its
241 // net delta (+1, same shape as a bare LoadLocal). The two
242 // inert primitive ops the peephole leaves at pc+1 / pc+2
243 // are walked as if live: their deltas (+1 PushConst, -1
244 // IntAdd) cancel, so the depth at pc+3 matches what the
245 // unfused sequence would have produced.
246 Op::LoadLocalAddIntConst { .. } => 1,
247 // Slice-2 fused op: src → dest with no net stack effect.
248 // Tombstones at the next 3 slots are *not* walked (see the
249 // control-flow successor logic in `verify_function`).
250 Op::LoadLocalAddIntConstStoreLocal { .. } => 0,
251 // Slice-3 fused op: LoadLocal(lhs) + LoadLocal(rhs) + IntAdd.
252 // Net delta +1 (pushes the sum). The trailing tombstones
253 // (LoadLocal + IntAdd) have deltas +1 and -1 — they cancel
254 // when walked as live, mirroring slice 1's shape.
255 Op::LoadLocalAddLocal { .. } => 1,
256 // Slice-4 fused ops: identical shape to slice 3, just with
257 // IntSub / IntMul as terminator. Net delta +1; trailing
258 // LoadLocal + IntSub|IntMul tombstones cancel when walked.
259 Op::LoadLocalSubLocal { .. } | Op::LoadLocalMulLocal { .. } => 1,
260 // Slice-5 fused ops: 4-slot window with net stack delta 0
261 // (original sequence had +1, +1, -1, -1). Worklist override
262 // above pushes both fall-through and branch successors with
263 // this depth; tombstones are not walked as live.
264 Op::LoadLocalEqIntConstJumpIfNot { .. }
265 | Op::LoadLocalStoreEqIntConstJumpIfNot { .. } => 0,
266 // Slice-7/8 fused ops (#461): net +1, same as bare LoadLocal.
267 // Trailing GetField (delta 0) + IntAdd/IntSub/IntMul (delta
268 // -1) tombstones cancel to -1 when walked, leaving depth at
269 // pc+3 matching the unfused [LoadLocal, GetField, <op>]
270 // sequence's overall delta of 0.
271 Op::LoadLocalGetFieldAdd { .. }
272 | Op::LoadLocalGetFieldSub { .. }
273 | Op::LoadLocalGetFieldMul { .. } => 1,
274 // Slice-9 fused op (#461): net +1 (LoadLocal +1, GetField 0),
275 // same as bare LoadLocal. The single trailing GetField
276 // tombstone (delta 0) leaves depth at pc+2 matching the
277 // unfused [LoadLocal, GetField] pair.
278 Op::LoadLocalGetField { .. } => 1,
279 }
280}
281
282#[cfg(test)]
283mod tests {
284 use super::*;
285 use crate::op::Op;
286 use crate::program::Function;
287
288 fn make_fn(name: &str, code: Vec<Op>) -> Function {
289 Function {
290 name: name.to_string(),
291 arity: 0,
292 locals_count: 4,
293 code,
294 effects: vec![],
295 body_hash: crate::program::ZERO_BODY_HASH,
296 refinements: vec![],
297 field_ic_sites: 0,
298 }
299 }
300
301 #[test]
302 fn clean_match_no_errors() {
303 // Simulates a two-arm match that is properly balanced:
304 // LoadLocal(0) ; push scrutinee depth=1
305 // Dup ; dup depth=2
306 // TestVariant("Ok") ; pop+push Bool depth=2
307 // JumpIfNot(+3) ; pop Bool, fall or jump depth=1
308 // Pop ; pop scrutinee depth=0
309 // PushConst(0) ; push result depth=1
310 // Jump(+2) ; to end depth=1
311 // Pop ; pop scrutinee (wildcard arm) depth=0
312 // PushConst(1) ; push result depth=1
313 // Return ; end depth=0
314 let code = vec![
315 Op::LoadLocal(0), // pc 0, depth 0→1
316 Op::Dup, // pc 1, depth 1→2
317 Op::TestVariant(0), // pc 2, depth 2→2
318 Op::JumpIfNot(3), // pc 3, depth 2→1; target=pc7
319 Op::Pop, // pc 4, depth 1→0
320 Op::PushConst(0), // pc 5, depth 0→1
321 Op::Jump(2), // pc 6, depth 1→1; target=pc9
322 Op::Pop, // pc 7, depth 1→0 (wildcard arm)
323 Op::PushConst(1), // pc 8, depth 0→1
324 Op::Return, // pc 9, depth 1→0
325 ];
326 let f = make_fn("clean", code);
327 let mut errs = Vec::new();
328 verify_function(&f, &mut errs);
329 assert!(errs.is_empty(), "expected no errors, got: {errs:?}");
330 }
331
332 #[test]
333 fn leaked_scrutinee_detected() {
334 // Two paths reach pc6 at different depths — mismatch detected.
335 // Fall path: pc2→pc3→pc6 at depth 1.
336 // Jump path: pc4→pc5→pc6 at depth 2 (extra push leaks).
337 let mismatch2 = vec![
338 Op::PushConst(0), // pc0 depth 0→1
339 Op::JumpIfNot(2), // pc1 depth 1→0; fall=pc2 depth0, jump=pc4 depth0
340 Op::PushConst(0), // pc2 depth 0→1
341 Op::Jump(2), // pc3 target=pc6, depth=1
342 Op::PushConst(0), // pc4 depth 0→1
343 Op::PushConst(0), // pc5 depth 1→2
344 Op::Return, // pc6: reached at depth=1 (from pc3) AND depth=2 (from pc5+fall)
345 ];
346 let f2 = make_fn("mismatch", mismatch2);
347 let mut errs2 = Vec::new();
348 verify_function(&f2, &mut errs2);
349 assert!(!errs2.is_empty(), "expected stack mismatch error");
350 assert_eq!(errs2[0].fn_name, "mismatch");
351 }
352}