1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
use std::fmt;
use std::io::{self, Write};
/// Marker emitted before the UTF-8 payload: the bytes `ESC % G`.
const UTF8_START: &[u8] = b"\x1B%G";
/// Marker emitted after the UTF-8 payload: the bytes `ESC % @`.
const UTF8_END: &[u8] = b"\x1B%@";
/// A borrowed UTF-8 string that is emitted surrounded by the `UTF8_START`
/// and `UTF8_END` markers.
///
/// The value only borrows the text for `'s`; copying it is cheap.
#[repr(transparent)]
#[derive(Copy, Clone)]
pub struct CText<'s> {
    /// The wrapped text, stored without the surrounding markers.
    utf8: &'s str,
}
/// Debug output is the wrapped text written verbatim: it is not quoted or
/// escaped, and the markers are not included.
impl fmt::Debug for CText<'_> {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let Self { utf8 } = self;
        f.write_str(utf8)
    }
}
/// Displays the wrapped text only; the start/end markers are not part of the
/// displayed output.
impl fmt::Display for CText<'_> {
    fn fmt(&self, out: &mut fmt::Formatter<'_>) -> fmt::Result {
        // Written directly, so width/precision flags are not applied.
        out.write_str(self.utf8)
    }
}
impl<'s> CText<'s> {
    /// Wraps `utf8` without copying it.
    pub const fn new(utf8: &'s str) -> Self {
        Self { utf8 }
    }

    /// Returns the number of bytes [`CText::write`] emits: the text's byte
    /// length plus the lengths of the start and end markers.
    pub const fn len(self) -> usize {
        self.utf8.len() + UTF8_START.len() + UTF8_END.len()
    }

    /// Writes the start marker, the UTF-8 bytes of the text and the end
    /// marker to `out`, returning the total number of bytes written.
    ///
    /// # Errors
    ///
    /// Returns the first I/O error reported by `out`. Because every part is
    /// written with `write_all`, a writer that stops accepting bytes yields
    /// an error instead of a silently truncated sequence.
    pub fn write(self, mut out: impl Write) -> io::Result<usize> {
        // `Write::write` may accept only a prefix of the buffer; `write_all`
        // keeps going until the whole part has been written.
        out.write_all(UTF8_START)?;
        out.write_all(self.utf8.as_bytes())?;
        out.write_all(UTF8_END)?;
        Ok(self.len())
    }
}
/// Builds a new byte vector holding `UTF8_START`, then the UTF-8 bytes of
/// `text`, then `UTF8_END`.
pub fn utf8_to_compound_text(text: &str) -> Vec<u8> {
    [UTF8_START, text.as_bytes(), UTF8_END].concat()
}
/// Extracts the text enclosed between `UTF8_START` and `UTF8_END`.
///
/// The returned string borrows from `bytes`; nothing is copied.
///
/// # Errors
///
/// Returns `Err(())` when `bytes` does not begin with `UTF8_START`, does not
/// end with `UTF8_END`, or when the enclosed bytes are not valid UTF-8.
pub fn compound_text_to_utf8(bytes: &[u8]) -> Result<&str, ()> {
    let payload = bytes
        .strip_prefix(UTF8_START)
        .and_then(|rest| rest.strip_suffix(UTF8_END))
        .ok_or(())?;
    std::str::from_utf8(payload).map_err(|_| ())
}
#[cfg(test)]
mod tests {
    use crate::{compound_text_to_utf8, utf8_to_compound_text};

    /// Round-trips a three-syllable Korean string through both conversion
    /// functions.
    #[test]
    fn korean() {
        let text = "가나다";
        // Start marker, three 3-byte syllables, end marker.
        let encoded: &[u8] = &[
            0x1B, 0x25, 0x47, // ESC % G
            0xEA, 0xB0, 0x80, // 가
            0xEB, 0x82, 0x98, // 나
            0xEB, 0x8B, 0xA4, // 다
            0x1B, 0x25, 0x40, // ESC % @
        ];

        let produced = utf8_to_compound_text(text);
        assert_eq!(produced, encoded);

        let decoded = compound_text_to_utf8(encoded).unwrap();
        assert_eq!(decoded, text);
    }
}