1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
use std::borrow::Cow;
use rustc_hash::{FxHashMap, FxHashSet};
use oxc_ast::{Comment, CommentKind, ast::Program};
use oxc_syntax::line_terminator::LineTerminatorSplitter;
use crate::{Codegen, LegalComment, options::CommentOptions};
/// Map from a comment's `attached_to` position to the comments anchored at
/// that position.
pub type CommentsMap = FxHashMap</* attached_to */ u32, Vec<Comment>>;
/// Which annotation kind an emission site expects to recover from
/// [`Codegen::annotation_comments`].
///
/// `@__PURE__` / `#__PURE__` on a `CallExpression` or `NewExpression`, and
/// `@__NO_SIDE_EFFECTS__` / `#__NO_SIDE_EFFECTS__` on a function declaration or
/// expression, are not interchangeable: downstream tree-shakers only honor
/// each on its corresponding node kind. The filter prevents
/// [`Codegen::print_annotation_comment`] from emitting one kind where the
/// other was expected when both share an `attached_to`.
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub enum AnnotationKind {
    /// `@__PURE__` / `#__PURE__`, expected at call / new expression sites.
    Pure,
    /// `@__NO_SIDE_EFFECTS__` / `#__NO_SIDE_EFFECTS__`, expected at function
    /// declaration / expression sites.
    NoSideEffects,
}
impl AnnotationKind {
    /// Whether `comment` is an annotation of this kind.
    #[inline]
    fn matches(self, comment: &Comment) -> bool {
        match self {
            Self::NoSideEffects => comment.is_no_side_effects(),
            Self::Pure => comment.is_pure(),
        }
    }

    /// Canonical literal used when the verbatim source text is unavailable.
    ///
    /// With `newline_after = true` the literal ends in a line break
    /// (statement-level sites such as function declarations and exports);
    /// with `false` it ends in a single space (inline sites such as
    /// call / new / function expressions).
    #[inline]
    fn canonical(self, newline_after: bool) -> &'static str {
        match self {
            Self::Pure if newline_after => "/* @__PURE__ */\n",
            Self::Pure => "/* @__PURE__ */ ",
            Self::NoSideEffects if newline_after => "/* @__NO_SIDE_EFFECTS__ */\n",
            Self::NoSideEffects => "/* @__NO_SIDE_EFFECTS__ */ ",
        }
    }
}
impl Codegen<'_> {
/// Sort `comments` into the lookup tables used during emission.
///
/// Does nothing when comment printing is disabled. Pure / no-side-effects
/// annotations go to `annotation_comments`; every other leading comment whose
/// category is enabled is appended to `comments` under its `attached_to`, and
/// legal comments additionally register that key in the sorted
/// `legal_comment_keys` list.
pub(crate) fn build_comments(&mut self, comments: &[Comment]) {
    if self.options.comments == CommentOptions::disabled() {
        return;
    }
    for comment in comments {
        let leading = comment.is_leading();

        // Pure / no-side-effects annotations are stashed by `attached_to` so
        // the emission site can reproduce the verbatim source text rather than
        // the canonical literal (rolldown#9408). This is best-effort: if
        // several annotations share an `attached_to`, the last one wins and
        // the others fall back to the canonical literal when emitted.
        if comment.is_pure() || comment.is_no_side_effects() {
            if leading && self.options.print_annotation_comment() {
                self.annotation_comments.insert(comment.attached_to, *comment);
            }
            continue;
        }

        // Only leading comments whose category is enabled are kept.
        let wanted = leading
            && ((comment.is_legal() && self.options.print_legal_comment())
                || (comment.is_jsdoc() && self.options.print_jsdoc_comment())
                || (comment.is_annotation() && self.options.print_annotation_comment())
                || (comment.is_normal() && self.options.print_normal_comment()));
        if !wanted {
            continue;
        }

        // Keep `legal_comment_keys` sorted and free of duplicates.
        if comment.is_legal() {
            if let Err(slot) = self.legal_comment_keys.binary_search(&comment.attached_to) {
                self.legal_comment_keys.insert(slot, comment.attached_to);
            }
        }
        self.comments.entry(comment.attached_to).or_default().push(*comment);
    }
}
/// Returns `true` if any comments are currently stored under the key `start`.
pub(crate) fn has_comment(&self, start: u32) -> bool {
self.comments.contains_key(&start)
}
/// Emit a pure / no-side-effects annotation comment for the AST node at
/// `start`, falling back to the canonical literal when no verbatim source
/// can be recovered.
///
/// The fallback covers four cases:
/// - no annotation comment is stashed at `start`,
/// - the stashed comment's kind doesn't match the emission site (e.g. a
/// `@__NO_SIDE_EFFECTS__` slot being queried by a `CallExpression`
/// site that needs `@__PURE__`),
/// - the comment is a line comment but the site can't break the line, or
/// - source text is unavailable (e.g. the [`Codegen::print_expression`]
/// path that skips [`Codegen::build_comments`]).
///
/// Export sites pass `self.span.start` and only recover verbatim when the
/// annotation precedes the `export` keyword. The rarer
/// `export /* @__NO_SIDE_EFFECTS__ */ function …` form (annotation between
/// `export` and `function`) attaches to the inner function's span and
/// falls back to canonical here.
pub(crate) fn print_annotation_comment(
&mut self,
start: u32,
kind: AnnotationKind,
newline_after: bool,
) {
if self.source_text.is_some()
&& let Some(comment) = self.annotation_comments.get(&start).copied()
&& kind.matches(&comment)
// Inline line comments would swallow the rest of the line.
&& (!comment.is_line() || newline_after)
{
self.annotation_comments.remove(&start);
self.print_comment(&comment);
if newline_after {
self.print_hard_newline();
} else {
self.print_str(" ");
}
return;
}
self.print_str(kind.canonical(newline_after));
}
/// Remove the comments stored under `start` and print them, if any exist.
pub(crate) fn print_leading_comments(&mut self, start: u32) {
    let Some(attached) = self.comments.remove(&start) else {
        return;
    };
    self.print_comments(&attached);
}
/// Remove and return the comments stored under `start`.
///
/// Returns `None` when nothing is stored there; an empty map is answered
/// without performing a lookup.
pub(crate) fn get_comments(&mut self, start: u32) -> Option<Vec<Comment>> {
    if self.comments.is_empty() { None } else { self.comments.remove(&start) }
}
/// Take the comments stored under `start` (via `get_comments`) and print them.
#[inline]
pub(crate) fn print_comments_at(&mut self, start: u32) {
    let Some(attached) = self.get_comments(start) else {
        return;
    };
    self.print_comments(&attached);
}
/// Print the leading comments at `start`, then consume any pending
/// indent-as-space so the following token glues to the comment instead of
/// breaking onto a new line. Nothing happens when no comments are stored at
/// `start`.
#[inline]
pub(crate) fn print_leading_comments_anchored_to_self(&mut self, start: u32) {
    let Some(attached) = self.get_comments(start) else {
        return;
    };
    self.print_comments(&attached);
    self.consume_pending_indent_space();
}
/// Whether a legal-comment orphan with `attached_to < end` is still pending.
/// Block emitters use this to keep an empty body multi-line.
///
/// Walks `legal_comment_keys` from the front, stops at the first key that is
/// not below `end`, and reports whether any visited key still has an entry
/// in `comments`.
#[inline]
pub(crate) fn has_legal_orphans_before(&self, end: u32) -> bool {
    for key in &self.legal_comment_keys {
        if *key >= end {
            break;
        }
        if self.comments.contains_key(key) {
            return true;
        }
    }
    false
}
/// Drain the pending legal-comment orphans with `attached_to < end` and emit
/// them in source order. Called at every statement boundary so legal
/// comments survive when their original anchor was removed by DCE.
#[inline]
pub(crate) fn print_legal_orphans_before(&mut self, end: u32) {
    // An empty key list yields a cutoff of 0 as well, so one check suffices.
    let cutoff = self.legal_comment_keys.partition_point(|&key| key < end);
    if cutoff == 0 {
        return;
    }

    // Gather the legal comments of every drained key into a single sequence:
    // calling `print_comments` per key would leak
    // `print_next_indent_as_space` and produce stray leading spaces.
    let mut orphans: Vec<Comment> = Vec::new();
    let pending = &mut self.comments;
    for key in self.legal_comment_keys.drain(..cutoff) {
        if let Some(bucket) = pending.get_mut(&key) {
            debug_assert!(bucket.iter().any(|c| c.is_legal()));
            orphans.extend(bucket.extract_if(.., |c| c.is_legal()));
            // Drop the entry once only legal comments were stored in it.
            if bucket.is_empty() {
                pending.remove(&key);
            }
        }
    }

    let Some(tail) = orphans.last_mut() else {
        return;
    };
    // Orphans are no longer at their original position, so the source's
    // `followed_by_newline` hint does not apply. Forcing it on makes
    // `print_comments` emit a trailing newline instead of setting
    // `print_next_indent_as_space` — otherwise the next indent (often before
    // `}`) collapses to a space and pass 2 stops matching.
    tail.set_followed_by_newline(true);
    self.print_comments(&orphans);
}
/// Print the comments attached to one position strictly inside the range
/// `(start, end)` (exclusive on both ends).
///
/// At most one key is consumed per call. When several keys fall inside the
/// range, the lowest one is chosen, so the selection follows source order
/// instead of depending on the hash map's iteration order.
///
/// Returns `true` if a key in the range was found and its comments were
/// handed to `print_comments`, `false` otherwise.
pub(crate) fn print_comments_in_range(&mut self, start: u32, end: u32) -> bool {
    if self.comments.is_empty() {
        return false;
    }
    // Hash-map key order is arbitrary; take the smallest matching key so the
    // result is deterministic and earliest-first.
    let earliest = self.comments.keys().copied().filter(|&key| key > start && key < end).min();
    let Some(key) = earliest else {
        return false;
    };
    // The key was just read from the map, so the entry is present.
    let Some(attached) = self.comments.remove(&key) else {
        return false;
    };
    self.print_comments(&attached);
    true
}
/// Print the comments stored under `start`, each on its own indented line,
/// followed by a final line break.
///
/// Returns `true` if at least one comment was printed; `false` when nothing
/// is stored at `start` (or the stored list is empty).
pub(crate) fn print_expr_comments(&mut self, start: u32) -> bool {
    let attached = if self.comments.is_empty() { None } else { self.comments.remove(&start) };
    let Some(attached) = attached else {
        return false;
    };
    if attached.is_empty() {
        return false;
    }
    for comment in &attached {
        self.print_hard_newline();
        self.print_indent();
        self.print_comment(comment);
    }
    self.print_hard_newline();
    true
}
/// Print a run of comments as one sequence.
///
/// - The first comment is placed on a fresh line when it was preceded by a
///   newline in the source, and is otherwise just indented.
/// - Each later comment is separated from the previous one by a newline plus
///   indent (preceded by a newline in the source), a bare newline (legal
///   comment), or a soft space.
/// - After the final comment a newline is emitted if it is a line comment or
///   was followed by a newline; otherwise `print_next_indent_as_space` is set.
///
/// An empty slice prints nothing.
pub(crate) fn print_comments(&mut self, comments: &[Comment]) {
    let Some((head, tail)) = comments.split_first() else {
        return;
    };

    if !head.preceded_by_newline() {
        self.print_indent();
    } else if let Some(byte) = self.last_byte() {
        // Avoid a second line break when the output is already on a new line.
        match byte {
            b'\t' => { /* noop */ }
            b'\n' => self.print_indent(),
            _ => {
                self.print_hard_newline();
                self.print_indent();
            }
        }
    }
    self.print_comment(head);

    for comment in tail {
        if comment.preceded_by_newline() {
            self.print_hard_newline();
            self.print_indent();
        } else if comment.is_legal() {
            self.print_hard_newline();
        } else {
            self.print_soft_space();
        }
        self.print_comment(comment);
    }

    // The trailing decision is made on the final comment of the run, which is
    // `head` itself when there is only one.
    let final_comment = tail.last().unwrap_or(head);
    if final_comment.is_line() || final_comment.followed_by_newline() {
        self.print_hard_newline();
    } else {
        self.print_next_indent_as_space = true;
    }
}
/// Print the source text of a single comment.
///
/// Prints nothing when no source text is available. Line and single-line
/// block comments are written as-is. Multi-line block comments are written
/// line by line: leading whitespace is trimmed from each line, every line
/// that does not start with `/*` gets the current indent, and a line break
/// follows every line that does not end with `*/`.
fn print_comment(&mut self, comment: &Comment) {
    let Some(source_text) = self.source_text else {
        return;
    };
    let raw = comment.span.source_text(source_text);
    match comment.kind {
        CommentKind::MultiLineBlock => {
            for line in LineTerminatorSplitter::new(raw) {
                let opens_block = line.starts_with("/*");
                let closes_block = line.ends_with("*/");
                if !opens_block {
                    self.print_indent();
                }
                self.print_str_escaping_script_close_tag(line.trim_start());
                if !closes_block {
                    self.print_hard_newline();
                }
            }
        }
        CommentKind::Line | CommentKind::SingleLineBlock => {
            self.print_str_escaping_script_close_tag(raw);
        }
    }
}
/// Handle Eof / Linked / External Comments.
/// Return a list of comments of linked or external.
pub(crate) fn handle_eof_linked_or_external_comments(
&mut self,
program: &Program<'_>,
) -> Vec<Comment> {
let legal_comments = &self.options.comments.legal;
if matches!(legal_comments, LegalComment::None | LegalComment::Inline) {
return vec![];
}
// Dedupe legal comments for smaller output size.
let mut set = FxHashSet::default();
let mut comments = vec![];
let source_text = program.source_text;
for comment in program.comments.iter().filter(|c| c.is_legal()) {
let mut text = Cow::Borrowed(comment.span.source_text(source_text));
if comment.is_multiline_block() {
let mut buffer = String::with_capacity(text.len());
// Print block comments with our own indentation.
for line in LineTerminatorSplitter::new(&text) {
if !line.starts_with("/*") {
buffer.push('\t');
}
buffer.push_str(line.trim_start());
if !line.ends_with("*/") {
buffer.push('\n');
}
}
text = Cow::Owned(buffer);
}
if set.insert(text) {
comments.push(*comment);
}
}
if comments.is_empty() {
return vec![];
}
match legal_comments {
LegalComment::Eof => {
self.print_hard_newline();
// Clear the flag to ensure consistent formatting for all EOF comments
self.print_next_indent_as_space = false;
for c in comments {
self.print_comment(&c);
self.print_hard_newline();
}
vec![]
}
LegalComment::Linked(path) => {
let path = path.clone();
self.print_hard_newline();
self.print_str("/*! For license information please see ");
self.print_str(&path);
self.print_str(" */");
comments
}
LegalComment::External => comments,
LegalComment::None | LegalComment::Inline => unreachable!(),
}
}
}