use core::str;
use crate::{DeserializeRevisioned, Error, Revisioned, SerializeRevisioned};
use super::vecs::serialize_bytes;
impl SerializeRevisioned for String {
#[inline]
fn serialize_revisioned<W: std::io::Write>(&self, writer: &mut W) -> Result<(), Error> {
serialize_bytes(self.as_bytes(), writer)
}
}
impl DeserializeRevisioned for String {
#[inline]
fn deserialize_revisioned<R: std::io::Read>(reader: &mut R) -> Result<Self, Error> {
let len = usize::deserialize_revisioned(reader)?;
if len == 0 {
return Ok(String::new());
}
let mut buf = vec![0u8; len];
reader.read_exact(&mut buf).map_err(Error::Io)?;
String::from_utf8(buf).map_err(|x| Error::Utf8Error(x.utf8_error()))
}
}
impl Revisioned for String {
#[inline]
fn revision() -> u16 {
1
}
}
impl SerializeRevisioned for str {
#[inline]
fn serialize_revisioned<W: std::io::Write>(&self, writer: &mut W) -> Result<(), Error> {
serialize_bytes(self.as_bytes(), writer)
}
}
impl Revisioned for str {
#[inline]
fn revision() -> u16 {
1
}
}
impl SerializeRevisioned for char {
#[inline]
fn serialize_revisioned<W: std::io::Write>(&self, w: &mut W) -> Result<(), Error> {
let buffer = &mut [0u8; 4];
w.write_all(self.encode_utf8(buffer).as_bytes()).map_err(Error::Io)
}
}
impl DeserializeRevisioned for char {
#[inline]
fn deserialize_revisioned<R: std::io::Read>(r: &mut R) -> Result<Self, Error> {
let mut buffer = [0u8; 4];
r.read_exact(&mut buffer[..1]).map_err(Error::Io)?;
let len = CHAR_LENGTH[buffer[0] as usize];
if len == 0 {
return Err(Error::InvalidCharEncoding);
}
r.read_exact(&mut buffer[1..(len as usize)]).map_err(Error::Io)?;
str::from_utf8(&buffer[..(len as usize)])
.map_err(|_| Error::InvalidCharEncoding)
.map(|x| x.chars().next().unwrap())
}
}
impl Revisioned for char {
#[inline]
fn revision() -> u16 {
1
}
}
static CHAR_LENGTH: [u8; 256] = const {
let mut r = [0u8; 256];
let mut i = 0;
while i < 256 {
if i & 0b1000_0000 == 0 {
r[i] = 1;
} else if i & 0b1110_0000 == 0b1100_0000 {
r[i] = 2;
} else if i & 0b1111_0000 == 0b1110_0000 {
r[i] = 3;
} else if i & 0b1111_1000 == 0b1111_0000 {
r[i] = 4;
}
i += 1;
}
r
};
#[cfg(test)]
mod tests {
use super::*;
use crate::implementations::assert_bincode_compat;
#[test]
fn test_string() {
let val = String::from("this is a test");
let mut mem: Vec<u8> = vec![];
val.serialize_revisioned(&mut mem).unwrap();
#[cfg(not(feature = "fixed-width-encoding"))]
assert_eq!(mem.len(), 15);
#[cfg(feature = "fixed-width-encoding")]
assert_eq!(mem.len(), 22);
let out =
<String as DeserializeRevisioned>::deserialize_revisioned(&mut mem.as_slice()).unwrap();
assert_eq!(val, out);
}
#[test]
fn test_char() {
let char = '𐃌';
let mut mem = Vec::new();
char.serialize_revisioned(&mut mem).unwrap();
let out = DeserializeRevisioned::deserialize_revisioned(&mut mem.as_slice()).unwrap();
assert_eq!(char, out);
}
#[test]
fn bincode_compat_char() {
assert_bincode_compat(&char::MAX);
assert_bincode_compat(&'\0');
assert_bincode_compat(&'z');
assert_bincode_compat(&'0');
assert_bincode_compat(&'ʘ');
assert_bincode_compat(&'ꚸ');
assert_bincode_compat(&'𐃌');
}
#[test]
fn str_and_string_serialize_identically() {
let cases: &[&str] = &[
"",
"a",
"this is a test",
"unicode: 🚀🔥✨",
"with\0embedded\0nuls",
&"x".repeat(300),
];
for &s in cases {
let mut from_str: Vec<u8> = Vec::new();
<str as SerializeRevisioned>::serialize_revisioned(s, &mut from_str).unwrap();
let owned = s.to_owned();
let mut from_string: Vec<u8> = Vec::new();
owned.serialize_revisioned(&mut from_string).unwrap();
assert_eq!(
from_str, from_string,
"str and String serialisation diverged for input {:?}",
s
);
let out =
<String as DeserializeRevisioned>::deserialize_revisioned(&mut from_str.as_slice())
.unwrap();
assert_eq!(out, owned);
}
}
#[test]
fn bincode_compat_string() {
assert_bincode_compat(&char::MAX.to_string());
assert_bincode_compat(&'\0'.to_string());
assert_bincode_compat(&'z'.to_string());
assert_bincode_compat(&'0'.to_string());
assert_bincode_compat(&'ʘ'.to_string());
assert_bincode_compat(&'ꚸ'.to_string());
assert_bincode_compat(&'𐃌'.to_string());
}
}