1#![allow(clippy::too_many_arguments)]
2
3#[cfg(target_arch = "aarch64")]
33use std::arch::aarch64::vandq_u8;
34#[cfg(target_arch = "aarch64")]
35use std::arch::aarch64::vceqq_u8;
36#[cfg(target_arch = "aarch64")]
37use std::arch::aarch64::vcgeq_u8;
38#[cfg(target_arch = "aarch64")]
39use std::arch::aarch64::vcleq_u8;
40#[cfg(target_arch = "aarch64")]
41use std::arch::aarch64::vdupq_n_u8;
42#[cfg(target_arch = "aarch64")]
43use std::arch::aarch64::vld1q_u8;
44#[cfg(target_arch = "aarch64")]
45use std::arch::aarch64::vminvq_u8;
46#[cfg(target_arch = "aarch64")]
47use std::arch::aarch64::vorrq_u8;
48#[cfg(target_arch = "x86_64")]
49use std::arch::x86_64::*;
50use std::collections::HashMap;
51use std::collections::HashSet;
52use std::hash::BuildHasherDefault;
53
54use ustr::IdentityHasher;
55
56pub use ustr::Ustr as Atom;
57pub use ustr::ustr as atom;
58
59pub type AtomMap<V> = HashMap<Atom, V, BuildHasherDefault<IdentityHasher>>;
64
65pub type AtomSet = HashSet<Atom, BuildHasherDefault<IdentityHasher>>;
70
71const STACK_BUF_SIZE: usize = 256;
73
74thread_local! {
75 static EMPTY_ATOM: Atom = atom("");
76}
77
78#[inline]
82#[must_use]
83pub fn empty_atom() -> Atom {
84 EMPTY_ATOM.with(|&atom| atom)
85}
86
87#[macro_export]
97macro_rules! concat_atom {
98 ($s1:expr, $s2:expr $(,)?) => {
99 $crate::concat_atom2(&$s1, &$s2)
100 };
101 ($s1:expr, $s2:expr, $s3:expr $(,)?) => {
102 $crate::concat_atom3(&$s1, &$s2, &$s3)
103 };
104 ($s1:expr, $s2:expr, $s3:expr, $s4:expr $(,)?) => {
105 $crate::concat_atom4(&$s1, &$s2, &$s3, &$s4)
106 };
107 ($s1:expr, $s2:expr, $s3:expr, $s4:expr, $s5:expr $(,)?) => {
108 $crate::concat_atom5(&$s1, &$s2, &$s3, &$s4, &$s5)
109 };
110 ($s1:expr, $s2:expr, $s3:expr, $s4:expr, $s5:expr, $s6:expr $(,)?) => {
111 $crate::concat_atom6(&$s1, &$s2, &$s3, &$s4, &$s5, &$s6)
112 };
113 ($s1:expr, $s2:expr, $s3:expr, $s4:expr, $s5:expr, $s6:expr, $s7:expr $(,)?) => {
114 $crate::concat_atom7(&$s1, &$s2, &$s3, &$s4, &$s5, &$s6, &$s7)
115 };
116 ($s1:expr, $s2:expr, $s3:expr, $s4:expr, $s5:expr, $s6:expr, $s7:expr, $s8:expr $(,)?) => {
117 $crate::concat_atom8(&$s1, &$s2, &$s3, &$s4, &$s5, &$s6, &$s7, &$s8)
118 };
119 ($s1:expr, $s2:expr, $s3:expr, $s4:expr, $s5:expr, $s6:expr, $s7:expr, $s8:expr, $s9:expr $(,)?) => {
120 $crate::concat_atom9(&$s1, &$s2, &$s3, &$s4, &$s5, &$s6, &$s7, &$s8, &$s9)
121 };
122 ($s1:expr, $s2:expr, $s3:expr, $s4:expr, $s5:expr, $s6:expr, $s7:expr, $s8:expr, $s9:expr, $s10:expr $(,)?) => {
123 $crate::concat_atom10(&$s1, &$s2, &$s3, &$s4, &$s5, &$s6, &$s7, &$s8, &$s9, &$s10)
124 };
125 ($s1:expr, $s2:expr, $s3:expr, $s4:expr, $s5:expr, $s6:expr, $s7:expr, $s8:expr, $s9:expr, $s10:expr, $s11:expr $(,)?) => {
126 $crate::concat_atom11(&$s1, &$s2, &$s3, &$s4, &$s5, &$s6, &$s7, &$s8, &$s9, &$s10, &$s11)
127 };
128 ($s1:expr, $s2:expr, $s3:expr, $s4:expr, $s5:expr, $s6:expr, $s7:expr, $s8:expr, $s9:expr, $s10:expr, $s11:expr, $s12:expr $(,)?) => {
129 $crate::concat_atom12(&$s1, &$s2, &$s3, &$s4, &$s5, &$s6, &$s7, &$s8, &$s9, &$s10, &$s11, &$s12)
130 };
131 ($($arg:expr),+ $(,)?) => {
132 compile_error!("concat_atom! macro supports between 2 and 12 arguments only")
133 };
134}
135
136#[inline]
142#[must_use]
143pub fn ascii_lowercase_constant_name_atom(name: &str) -> Atom {
144 if let Some(last_slash_idx) = name.rfind('\\') {
145 let (namespace, const_name) = name.split_at(last_slash_idx);
146 let const_name = &const_name[1..];
147
148 if name.len() > STACK_BUF_SIZE {
149 let mut lowercased_namespace = namespace.to_ascii_lowercase();
150 lowercased_namespace.push('\\');
151 lowercased_namespace.push_str(const_name);
152 return atom(&lowercased_namespace);
153 }
154
155 let mut stack_buf = [0u8; STACK_BUF_SIZE];
156 let mut index = 0;
157
158 for byte in namespace.bytes() {
159 stack_buf[index] = byte.to_ascii_lowercase();
160 index += 1;
161 }
162
163 stack_buf[index] = b'\\';
164 index += 1;
165
166 let const_bytes = const_name.as_bytes();
167 stack_buf[index..index + const_bytes.len()].copy_from_slice(const_bytes);
168 index += const_bytes.len();
169
170 atom(
171 unsafe { std::str::from_utf8_unchecked(&stack_buf[..index]) },
173 )
174 } else {
175 atom(name)
176 }
177}
178
179#[inline]
186#[must_use]
187pub fn ascii_lowercase_atom(s: &str) -> Atom {
188 let bytes = s.as_bytes();
189
190 if !bytes.iter().any(u8::is_ascii_uppercase) {
192 return atom(s);
193 }
194
195 if s.len() <= STACK_BUF_SIZE {
197 let mut stack_buf = [0u8; STACK_BUF_SIZE];
198 for (i, &b) in bytes.iter().enumerate() {
199 stack_buf[i] = b.to_ascii_lowercase();
200 }
201 return atom(
202 unsafe { std::str::from_utf8_unchecked(&stack_buf[..s.len()]) },
204 );
205 }
206
207 atom(&s.to_ascii_lowercase())
208}
209
210#[inline]
227#[must_use]
228pub fn starts_with_ignore_case(haystack: &str, prefix: &str) -> bool {
229 #[cfg(target_arch = "x86_64")]
230 #[target_feature(enable = "avx2")]
231 unsafe fn starts_with_avx2(haystack: &str, prefix: &str, len: usize) -> bool {
232 unsafe {
233 let haystack_bytes = haystack.as_bytes();
234 let prefix_bytes = prefix.as_bytes();
235
236 let lower_a = _mm256_set1_epi8(b'a' as i8);
237 let lower_z = _mm256_set1_epi8(b'z' as i8);
238 let case_bit = _mm256_set1_epi8(0x20);
239
240 let mut i = 0;
241 while i + 32 <= len {
242 let h = _mm256_loadu_si256(haystack_bytes.as_ptr().add(i) as *const __m256i);
243 let p = _mm256_loadu_si256(prefix_bytes.as_ptr().add(i) as *const __m256i);
244
245 let h_is_lower = _mm256_and_si256(
247 _mm256_cmpgt_epi8(h, _mm256_sub_epi8(lower_a, _mm256_set1_epi8(1))),
248 _mm256_cmpgt_epi8(_mm256_add_epi8(lower_z, _mm256_set1_epi8(1)), h),
249 );
250 let h_lower = _mm256_or_si256(h, _mm256_and_si256(h_is_lower, case_bit));
251
252 let p_is_lower = _mm256_and_si256(
254 _mm256_cmpgt_epi8(p, _mm256_sub_epi8(lower_a, _mm256_set1_epi8(1))),
255 _mm256_cmpgt_epi8(_mm256_add_epi8(lower_z, _mm256_set1_epi8(1)), p),
256 );
257 let p_lower = _mm256_or_si256(p, _mm256_and_si256(p_is_lower, case_bit));
258
259 let eq = _mm256_cmpeq_epi8(h_lower, p_lower);
260 let mask = _mm256_movemask_epi8(eq);
261 if mask != -1i32 {
262 return false;
263 }
264
265 i += 32;
266 }
267
268 haystack_bytes[i..len].eq_ignore_ascii_case(&prefix_bytes[i..len])
270 }
271 }
272
273 #[cfg(target_arch = "aarch64")]
274 #[target_feature(enable = "neon")]
275 unsafe fn starts_with_neon(haystack: &str, prefix: &str, len: usize) -> bool {
276 unsafe {
277 let haystack_bytes = haystack.as_bytes();
278 let prefix_bytes = prefix.as_bytes();
279
280 let lower_a = vdupq_n_u8(b'a');
281 let lower_z = vdupq_n_u8(b'z');
282 let case_bit = vdupq_n_u8(0x20);
283
284 let mut i = 0;
285 while i + 16 <= len {
286 let h = vld1q_u8(haystack_bytes.as_ptr().add(i));
287 let p = vld1q_u8(prefix_bytes.as_ptr().add(i));
288
289 let h_ge_a = vcgeq_u8(h, lower_a);
291 let h_le_z = vcleq_u8(h, lower_z);
292 let h_is_lower = vandq_u8(h_ge_a, h_le_z);
293 let h_lower = vorrq_u8(h, vandq_u8(h_is_lower, case_bit));
294
295 let p_ge_a = vcgeq_u8(p, lower_a);
297 let p_le_z = vcleq_u8(p, lower_z);
298 let p_is_lower = vandq_u8(p_ge_a, p_le_z);
299 let p_lower = vorrq_u8(p, vandq_u8(p_is_lower, case_bit));
300
301 let eq = vceqq_u8(h_lower, p_lower);
302 let min = vminvq_u8(eq);
303 if min != 0xFF {
304 return false;
305 }
306
307 i += 16;
308 }
309
310 haystack_bytes[i..len].eq_ignore_ascii_case(&prefix_bytes[i..len])
312 }
313 }
314
315 let len = prefix.len();
316 if haystack.len() < len {
317 return false;
318 }
319
320 #[cfg(target_arch = "x86_64")]
321 {
322 if len >= 32 && std::is_x86_feature_detected!("avx2") {
323 return unsafe { starts_with_avx2(haystack, prefix, len) };
325 }
326 }
327
328 #[cfg(target_arch = "aarch64")]
329 {
330 if len >= 16 {
331 return unsafe { starts_with_neon(haystack, prefix, len) };
333 }
334 }
335
336 haystack.as_bytes()[..len].eq_ignore_ascii_case(prefix.as_bytes())
337}
338
339macro_rules! integer_to_atom_fns {
341 ( $( $func_name:ident($num_type:ty) ),+ $(,)? ) => {
342 $(
343 #[doc = "Creates an `Atom` from a `"]
344 #[doc = stringify!($num_type)]
345 #[doc = "` value with zero heap allocations."]
346 #[inline]
347 #[must_use]
348 pub fn $func_name(n: $num_type) -> Atom {
349 let mut buffer = itoa::Buffer::new();
350 let s = buffer.format(n);
351
352 atom(s)
353 }
354 )+
355 };
356}
357
358macro_rules! float_to_atom_fns {
360 ( $( $func_name:ident($num_type:ty) ),+ $(,)? ) => {
361 $(
362 #[doc = "Creates an `Atom` from a `"]
363 #[doc = stringify!($num_type)]
364 #[doc = "` value with zero heap allocations."]
365 #[inline]
366 #[must_use]
367 pub fn $func_name(n: $num_type) -> Atom {
368 let mut buffer = ryu::Buffer::new();
369 let s = buffer.format(n);
370
371 atom(s)
372 }
373 )+
374 };
375}
376
377macro_rules! concat_fns {
379 ( $( $func_name:ident($n:literal, $($s:ident),+) ),+ $(,)?) => {
380 $(
381 #[doc = "Creates an `Atom` as a result of concatenating "]
382 #[doc = stringify!($n)]
383 #[doc = " string slices."]
384 #[inline]
385 #[must_use]
386 #[allow(unused_assignments)]
387 pub fn $func_name($($s: &str),+) -> Atom {
388 let total_len = 0 $(+ $s.len())+;
389
390 if total_len <= STACK_BUF_SIZE {
391 let mut buffer = [0u8; STACK_BUF_SIZE];
392 let mut index = 0;
393 $(
394 buffer[index..index + $s.len()].copy_from_slice($s.as_bytes());
395 index += $s.len();
396 )+
397 return atom(unsafe { std::str::from_utf8_unchecked(&buffer[..total_len]) });
398 }
399
400 let mut result = String::with_capacity(total_len);
402 $( result.push_str($s); )+
403 atom(&result)
404 }
405 )+
406 };
407}
408
409integer_to_atom_fns!(
411 i8_atom(i8),
412 i16_atom(i16),
413 i32_atom(i32),
414 i64_atom(i64),
415 i128_atom(i128),
416 isize_atom(isize),
417 u8_atom(u8),
418 u16_atom(u16),
419 u32_atom(u32),
420 u64_atom(u64),
421 u128_atom(u128),
422 usize_atom(usize),
423);
424
425float_to_atom_fns!(f32_atom(f32), f64_atom(f64),);
426
427concat_fns!(
428 concat_atom2(2, s1, s2),
429 concat_atom3(3, s1, s2, s3),
430 concat_atom4(4, s1, s2, s3, s4),
431 concat_atom5(5, s1, s2, s3, s4, s5),
432 concat_atom6(6, s1, s2, s3, s4, s5, s6),
433 concat_atom7(7, s1, s2, s3, s4, s5, s6, s7),
434 concat_atom8(8, s1, s2, s3, s4, s5, s6, s7, s8),
435 concat_atom9(9, s1, s2, s3, s4, s5, s6, s7, s8, s9),
436 concat_atom10(10, s1, s2, s3, s4, s5, s6, s7, s8, s9, s10),
437 concat_atom11(11, s1, s2, s3, s4, s5, s6, s7, s8, s9, s10, s11),
438 concat_atom12(12, s1, s2, s3, s4, s5, s6, s7, s8, s9, s10, s11, s12),
439);