/// Turns a boolean expression into an integer literal: `1` when the
/// expression evaluates to `true`, `0` when it evaluates to `false`.
///
/// The expansion is an untyped integer literal, so the concrete integer type
/// is inferred at the call site.
#[macro_export]
macro_rules! big_if_true {
    ($cond:expr) => {
        match $cond {
            true => 1,
            false => 0,
        }
    };
}
/// A code point stored as a plain 32-bit unsigned integer; this is the value
/// type yielded by `CodePointsIterator` and accepted by the width functions.
type WChar = u32;
/// A `(first, last)` pair of code points; `bisearch` treats both ends as
/// inclusive when testing membership.
type Interval = (WChar, WChar);
/// Iterator over the characters of a borrowed string, yielding each one as a
/// numeric `WChar` value.
pub struct CodePointsIterator<'a> {
/// Characters of the borrowed string that have not been yielded yet.
rest: std::str::Chars<'a>,
}
impl Iterator for CodePointsIterator<'_> {
type Item = WChar;
fn next(&mut self) -> Option<WChar> {
self.rest.next().map(|c| c as WChar)
}
}
/// Gives string-like types a `code_points` method; implemented in this file
/// for `str` and `&str`.
pub trait CodePointsIter {
/// Returns a `CodePointsIterator` borrowing from `self`.
fn code_points(&self) -> CodePointsIterator<'_>;
}
impl CodePointsIter for str {
    /// Builds a `CodePointsIterator` that walks the characters of this string
    /// slice from the beginning.
    fn code_points(&self) -> CodePointsIterator<'_> {
        let rest = self.chars();
        CodePointsIterator { rest }
    }
}
impl CodePointsIter for &str {
    /// Builds a `CodePointsIterator` over the characters of the referenced
    /// string slice.
    fn code_points(&self) -> CodePointsIterator<'_> {
        // `self` is `&&str`; deref coercion hands the inner slice to `chars`.
        let rest = str::chars(self);
        CodePointsIterator { rest }
    }
}
/// Reports whether `ucs` lies inside any interval of `table`.
///
/// `table` must be sorted in ascending order and its inclusive
/// `(first, last)` intervals must not overlap; the result is unspecified
/// otherwise. An empty table never matches.
fn bisearch(ucs: WChar, table: &[Interval]) -> bool {
    // Delegating to the standard binary search avoids hand-written index
    // arithmetic (`mid - 1` on a `usize`) and needs no special-casing for an
    // empty table.
    table
        .binary_search_by(|&(first, last)| {
            if last < ucs {
                // The whole interval is below the target: look further right.
                std::cmp::Ordering::Less
            } else if first > ucs {
                // The whole interval is above the target: look further left.
                std::cmp::Ordering::Greater
            } else {
                // first <= ucs <= last
                std::cmp::Ordering::Equal
            }
        })
        .is_ok()
}
/// Classifies `ucs` against the lookup tables in `super::tables` and returns
/// its width.
///
/// The tables are consulted in a fixed order and the first match wins:
///
/// 1. `ASCII` gives `Some(1)`.
/// 2. `PRIVATE`, `NONPRINT` or `COMBINING` gives `None`.
/// 3. `DOUBLEWIDE` gives `Some(2)`.
/// 4. `AMBIGUOUS` gives `Some(1)`.
/// 5. `UNASSIGNED` or `WIDENEDIN9` gives `Some(2)`.
///
/// A code point found in none of the tables gets `Some(1)`.
pub fn wcwidth(ucs: WChar) -> Option<usize> {
    if bisearch(ucs, super::tables::ASCII) {
        return Some(1);
    }

    let has_no_width = bisearch(ucs, super::tables::PRIVATE)
        || bisearch(ucs, super::tables::NONPRINT)
        || bisearch(ucs, super::tables::COMBINING);
    if has_no_width {
        return None;
    }

    if bisearch(ucs, super::tables::DOUBLEWIDE) {
        return Some(2);
    }

    // Checked before the remaining wide tables, so an ambiguous code point is
    // reported as narrow.
    if bisearch(ucs, super::tables::AMBIGUOUS) {
        return Some(1);
    }

    let widened =
        bisearch(ucs, super::tables::UNASSIGNED) || bisearch(ucs, super::tables::WIDENEDIN9);
    Some(if widened { 2 } else { 1 })
}
pub fn wcswidth(mut pwcs: WChar, mut n: usize) -> Option<usize> {
let mut width = 0;
while pwcs > 0 && n > 0 {
if let Some(w) = wcwidth(pwcs) {
width += w;
} else {
return None;
}
pwcs += 1;
n -= 1;
}
Some(width)
}
#[cfg(test)]
mod tests {
    use super::*;
    use crate::text::{grapheme_clusters::TextProcessing, TextPresentation};

    /// Checks code point extraction and grapheme width computation on a mix
    /// of ASCII, symbol, emoji and CJK strings.
    #[test]
    fn test_wcwidth() {
        // Gathers the code points of a string so they can be compared with
        // literal arrays.
        let cps = |s: &str| s.code_points().collect::<Vec<_>>();

        // Code point extraction.
        assert_eq!(cps("abc\0"), [0x61, 0x62, 0x63, 0x0]);
        assert_eq!(cps("●"), [0x25cf]);
        assert_eq!(cps("📎"), [0x1f4ce]);
        assert_eq!(
            cps("𐼹𐼺𐼻𐼼𐼽"),
            [0x10F39, 0x10F3A, 0x10F3B, 0x10F3C, 0x10F3D]
        );
        assert_eq!(cps("𐼹a𐼽b"), [0x10F39, 0x61, 0x10F3D, 0x62]);
        assert_eq!(cps("📎\u{FE0E}"), [0x1f4ce, 0xfe0e]);

        // Grapheme widths, with and without variation selectors.
        assert_eq!("●".grapheme_width(), 1);
        assert_eq!("●📎".grapheme_width(), 3);
        assert_eq!("●📎︎".grapheme_width(), 3);
        assert_eq!("●\u{FE0E}📎\u{FE0E}".grapheme_width(), 3);
        assert_eq!("🎃".grapheme_width(), 2);
        assert_eq!("👻".grapheme_width(), 2);
        assert_eq!("🛡︎".grapheme_width(), 2);
        assert_eq!("🛡︎".text_pr().grapheme_width(), 2);

        // Wide CJK text, alone and interleaved with narrow symbols.
        assert_eq!("こんにちわ世界".grapheme_width(), 14);
        assert_eq!("こ★ん■に●ち▲わ☆世◆界".grapheme_width(), 20);
    }
}