Skip to main content

srcmap_scopes/
encode.rs

1//! Encoder for the ECMA-426 scopes proposal.
2//!
3//! Encodes structured `ScopeInfo` into a VLQ-encoded `scopes` string.
4
5use std::collections::HashMap;
6
7use srcmap_codec::{vlq_encode, vlq_encode_unsigned};
8
9use crate::{
10    Binding, GeneratedRange, OriginalScope, ScopeInfo, TAG_GENERATED_RANGE_BINDINGS,
11    TAG_GENERATED_RANGE_CALL_SITE, TAG_GENERATED_RANGE_END, TAG_GENERATED_RANGE_START,
12    TAG_GENERATED_RANGE_SUB_RANGE_BINDINGS, TAG_ORIGINAL_SCOPE_END, TAG_ORIGINAL_SCOPE_START,
13    TAG_ORIGINAL_SCOPE_VARIABLES, resolve_or_add_name,
14};
15
16// ── Encoder ──────────────────────────────────────────────────────
17
18struct ScopesEncoder<'a> {
19    output: Vec<u8>,
20    names: &'a mut Vec<String>,
21    name_map: HashMap<String, u32>,
22    first_item: bool,
23
24    // Original scope relative state
25    os_line: u32,
26    os_col: u32,
27    os_name: i64,
28    os_kind: i64,
29    os_var: i64,
30
31    // Generated range relative state
32    gr_line: u32,
33    gr_col: u32,
34    gr_def: i64,
35}
36
37impl<'a> ScopesEncoder<'a> {
38    fn new(names: &'a mut Vec<String>) -> Self {
39        let name_map: HashMap<String, u32> =
40            names.iter().enumerate().map(|(i, n)| (n.clone(), i as u32)).collect();
41
42        Self {
43            output: Vec::with_capacity(256),
44            names,
45            name_map,
46            first_item: true,
47            os_line: 0,
48            os_col: 0,
49            os_name: 0,
50            os_kind: 0,
51            os_var: 0,
52            gr_line: 0,
53            gr_col: 0,
54            gr_def: 0,
55        }
56    }
57
58    #[inline]
59    fn emit_comma(&mut self) {
60        if !self.first_item {
61            self.output.push(b',');
62        }
63        self.first_item = false;
64    }
65
66    #[inline]
67    fn emit_tag(&mut self, tag: u64) {
68        vlq_encode_unsigned(&mut self.output, tag);
69    }
70
71    #[inline]
72    fn emit_unsigned(&mut self, value: u64) {
73        vlq_encode_unsigned(&mut self.output, value);
74    }
75
76    #[inline]
77    fn emit_signed(&mut self, value: i64) {
78        vlq_encode(&mut self.output, value);
79    }
80
81    #[inline]
82    fn name_idx(&mut self, name: &str) -> u32 {
83        resolve_or_add_name(name, self.names, &mut self.name_map)
84    }
85
86    fn encode(mut self, info: &ScopeInfo) -> String {
87        // Phase 1: Encode original scope trees
88        for scope in &info.scopes {
89            match scope {
90                Some(s) => {
91                    // Reset position state for new top-level tree
92                    self.os_line = 0;
93                    self.os_col = 0;
94                    self.encode_original_scope(s);
95                }
96                None => {
97                    // Empty item: emit a comma to mark the absent source
98                    self.emit_comma();
99                }
100            }
101        }
102
103        // Phase 2: Encode generated ranges
104        for range in &info.ranges {
105            self.encode_generated_range(range);
106        }
107
108        debug_assert!(self.output.is_ascii());
109        // SAFETY: vlq_encode/vlq_encode_unsigned only push bytes from
110        // BASE64_ENCODE (all ASCII), and we only add b',' — all valid UTF-8.
111        unsafe { String::from_utf8_unchecked(self.output) }
112    }
113
114    fn encode_original_scope(&mut self, scope: &OriginalScope) {
115        // B item: scope start
116        self.emit_comma();
117        self.emit_tag(TAG_ORIGINAL_SCOPE_START);
118
119        let mut flags: u64 = 0;
120        if scope.name.is_some() {
121            flags |= crate::OS_FLAG_HAS_NAME;
122        }
123        if scope.kind.is_some() {
124            flags |= crate::OS_FLAG_HAS_KIND;
125        }
126        if scope.is_stack_frame {
127            flags |= crate::OS_FLAG_IS_STACK_FRAME;
128        }
129        self.emit_unsigned(flags);
130
131        // Line (relative)
132        let line_delta = scope.start.line - self.os_line;
133        self.emit_unsigned(line_delta as u64);
134        self.os_line = scope.start.line;
135
136        // Column (absolute if line changed, relative if same line)
137        let col =
138            if line_delta != 0 { scope.start.column } else { scope.start.column - self.os_col };
139        self.emit_unsigned(col as u64);
140        self.os_col = scope.start.column;
141
142        // Name (signed relative)
143        if let Some(ref name) = scope.name {
144            let idx = self.name_idx(name) as i64;
145            self.emit_signed(idx - self.os_name);
146            self.os_name = idx;
147        }
148
149        // Kind (signed relative)
150        if let Some(ref kind) = scope.kind {
151            let idx = self.name_idx(kind) as i64;
152            self.emit_signed(idx - self.os_kind);
153            self.os_kind = idx;
154        }
155
156        // D item: variables
157        if !scope.variables.is_empty() {
158            self.emit_comma();
159            self.emit_tag(TAG_ORIGINAL_SCOPE_VARIABLES);
160            for var in &scope.variables {
161                let idx = self.name_idx(var) as i64;
162                self.emit_signed(idx - self.os_var);
163                self.os_var = idx;
164            }
165        }
166
167        // Recursively encode children
168        for child in &scope.children {
169            self.encode_original_scope(child);
170        }
171
172        // C item: scope end
173        self.emit_comma();
174        self.emit_tag(TAG_ORIGINAL_SCOPE_END);
175
176        let line_delta = scope.end.line - self.os_line;
177        self.emit_unsigned(line_delta as u64);
178        self.os_line = scope.end.line;
179
180        let col = if line_delta != 0 { scope.end.column } else { scope.end.column - self.os_col };
181        self.emit_unsigned(col as u64);
182        self.os_col = scope.end.column;
183    }
184
185    fn encode_generated_range(&mut self, range: &GeneratedRange) {
186        // E item: range start
187        self.emit_comma();
188        self.emit_tag(TAG_GENERATED_RANGE_START);
189
190        let line_delta = range.start.line - self.gr_line;
191
192        let mut flags: u64 = 0;
193        if line_delta != 0 {
194            flags |= crate::GR_FLAG_HAS_LINE;
195        }
196        if range.definition.is_some() {
197            flags |= crate::GR_FLAG_HAS_DEFINITION;
198        }
199        if range.is_stack_frame {
200            flags |= crate::GR_FLAG_IS_STACK_FRAME;
201        }
202        if range.is_hidden {
203            flags |= crate::GR_FLAG_IS_HIDDEN;
204        }
205        self.emit_unsigned(flags);
206
207        if line_delta != 0 {
208            self.emit_unsigned(line_delta as u64);
209        }
210        self.gr_line = range.start.line;
211
212        let col =
213            if line_delta != 0 { range.start.column } else { range.start.column - self.gr_col };
214        self.emit_unsigned(col as u64);
215        self.gr_col = range.start.column;
216
217        if let Some(def) = range.definition {
218            let def_val = def as i64;
219            self.emit_signed(def_val - self.gr_def);
220            self.gr_def = def_val;
221        }
222
223        // G item: bindings
224        if !range.bindings.is_empty() {
225            self.emit_comma();
226            self.emit_tag(TAG_GENERATED_RANGE_BINDINGS);
227            for binding in &range.bindings {
228                match binding {
229                    Binding::Expression(expr) => {
230                        let idx = self.name_idx(expr);
231                        self.emit_unsigned(idx as u64 + 1); // 1-based
232                    }
233                    Binding::Unavailable => {
234                        self.emit_unsigned(0);
235                    }
236                    Binding::SubRanges(subs) => {
237                        // G gets the first sub-range's binding
238                        if let Some(first) = subs.first() {
239                            match &first.expression {
240                                Some(expr) => {
241                                    let idx = self.name_idx(expr);
242                                    self.emit_unsigned(idx as u64 + 1);
243                                }
244                                None => {
245                                    self.emit_unsigned(0);
246                                }
247                            }
248                        } else {
249                            self.emit_unsigned(0);
250                        }
251                    }
252                }
253            }
254        }
255
256        // H items: sub-range bindings
257        let mut h_var_idx = 0u64;
258        for (i, binding) in range.bindings.iter().enumerate() {
259            if let Binding::SubRanges(subs) = binding
260                && subs.len() > 1
261            {
262                self.emit_comma();
263                self.emit_tag(TAG_GENERATED_RANGE_SUB_RANGE_BINDINGS);
264
265                // Variable index (relative to previous H item, or 0 for the first)
266                let var_delta = i as u64 - h_var_idx;
267                self.emit_unsigned(var_delta);
268                h_var_idx = i as u64;
269
270                // Sub-range line/col state (relative to range start)
271                let mut h_line = range.start.line;
272                let mut h_col = range.start.column;
273
274                // Skip first sub-range (that's in G), encode the rest
275                for sub in &subs[1..] {
276                    // Binding (1-based absolute)
277                    match &sub.expression {
278                        Some(expr) => {
279                            let idx = self.name_idx(expr);
280                            self.emit_unsigned(idx as u64 + 1);
281                        }
282                        None => {
283                            self.emit_unsigned(0);
284                        }
285                    }
286
287                    let sub_line_delta = sub.from.line - h_line;
288                    self.emit_unsigned(sub_line_delta as u64);
289                    h_line = sub.from.line;
290
291                    let sub_col =
292                        if sub_line_delta != 0 { sub.from.column } else { sub.from.column - h_col };
293                    self.emit_unsigned(sub_col as u64);
294                    h_col = sub.from.column;
295                }
296            }
297        }
298
299        // I item: call site
300        if let Some(ref cs) = range.call_site {
301            self.emit_comma();
302            self.emit_tag(TAG_GENERATED_RANGE_CALL_SITE);
303            self.emit_unsigned(cs.source_index as u64);
304            self.emit_unsigned(cs.line as u64);
305            self.emit_unsigned(cs.column as u64);
306        }
307
308        // Recursively encode children
309        for child in &range.children {
310            self.encode_generated_range(child);
311        }
312
313        // F item: range end
314        self.emit_comma();
315        self.emit_tag(TAG_GENERATED_RANGE_END);
316
317        let line_delta = range.end.line - self.gr_line;
318        if line_delta != 0 {
319            self.emit_unsigned(line_delta as u64);
320        }
321        self.gr_line = range.end.line;
322
323        let col = if line_delta != 0 { range.end.column } else { range.end.column - self.gr_col };
324        self.emit_unsigned(col as u64);
325        self.gr_col = range.end.column;
326    }
327}
328
329/// Encode scope information into a VLQ-encoded `scopes` string.
330///
331/// New names may be added to the `names` array during encoding.
332pub fn encode_scopes(info: &ScopeInfo, names: &mut Vec<String>) -> String {
333    let encoder = ScopesEncoder::new(names);
334    encoder.encode(info)
335}