#![allow(dead_code)]
#![allow(unused)]
use crate::__internal::runtime::InnerProtoString;
use crate::__internal::{Private, SealedInternal};
use crate::{
utf8::Utf8Chunks, AsView, IntoProxied, IntoView, Mut, MutProxied, MutProxy, Optional, Proxied,
Proxy, View, ViewProxy,
};
use std::borrow::Cow;
use std::cmp::{Eq, Ord, Ordering, PartialEq, PartialOrd};
use std::convert::{AsMut, AsRef};
use std::ffi::{OsStr, OsString};
use std::fmt;
use std::hash::{Hash, Hasher};
use std::iter;
use std::ops::{Deref, DerefMut};
use std::ptr;
use std::rc::Rc;
use std::sync::Arc;
pub struct ProtoBytes {
pub(crate) inner: InnerProtoString,
}
impl ProtoBytes {
#[doc(hidden)]
pub fn into_inner(self, _private: Private) -> InnerProtoString {
self.inner
}
#[doc(hidden)]
pub fn from_inner(_private: Private, inner: InnerProtoString) -> ProtoBytes {
Self { inner }
}
pub fn as_view(&self) -> &[u8] {
self.inner.as_bytes()
}
}
impl AsRef<[u8]> for ProtoBytes {
fn as_ref(&self) -> &[u8] {
self.inner.as_bytes()
}
}
impl From<&[u8]> for ProtoBytes {
fn from(v: &[u8]) -> ProtoBytes {
ProtoBytes { inner: InnerProtoString::from(v) }
}
}
impl<const N: usize> From<&[u8; N]> for ProtoBytes {
fn from(v: &[u8; N]) -> ProtoBytes {
ProtoBytes { inner: InnerProtoString::from(v.as_ref()) }
}
}
impl SealedInternal for ProtoBytes {}
impl Proxied for ProtoBytes {
type View<'msg> = &'msg [u8];
}
impl AsView for ProtoBytes {
type Proxied = Self;
fn as_view(&self) -> &[u8] {
self.as_view()
}
}
impl IntoProxied<ProtoBytes> for &[u8] {
fn into_proxied(self, _private: Private) -> ProtoBytes {
ProtoBytes::from(self)
}
}
impl<const N: usize> IntoProxied<ProtoBytes> for &[u8; N] {
fn into_proxied(self, _private: Private) -> ProtoBytes {
ProtoBytes::from(self.as_ref())
}
}
impl IntoProxied<ProtoBytes> for Vec<u8> {
fn into_proxied(self, _private: Private) -> ProtoBytes {
ProtoBytes::from(AsRef::<[u8]>::as_ref(&self))
}
}
impl IntoProxied<ProtoBytes> for &Vec<u8> {
fn into_proxied(self, _private: Private) -> ProtoBytes {
ProtoBytes::from(AsRef::<[u8]>::as_ref(self))
}
}
impl IntoProxied<ProtoBytes> for Box<[u8]> {
fn into_proxied(self, _private: Private) -> ProtoBytes {
ProtoBytes::from(AsRef::<[u8]>::as_ref(&self))
}
}
impl IntoProxied<ProtoBytes> for Cow<'_, [u8]> {
fn into_proxied(self, _private: Private) -> ProtoBytes {
ProtoBytes::from(AsRef::<[u8]>::as_ref(&self))
}
}
impl IntoProxied<ProtoBytes> for Rc<[u8]> {
fn into_proxied(self, _private: Private) -> ProtoBytes {
ProtoBytes::from(AsRef::<[u8]>::as_ref(&self))
}
}
impl IntoProxied<ProtoBytes> for Arc<[u8]> {
fn into_proxied(self, _private: Private) -> ProtoBytes {
ProtoBytes::from(AsRef::<[u8]>::as_ref(&self))
}
}
impl SealedInternal for &[u8] {}
impl<'msg> Proxy<'msg> for &'msg [u8] {}
impl AsView for &[u8] {
type Proxied = ProtoBytes;
fn as_view(&self) -> &[u8] {
self
}
}
impl<'msg> IntoView<'msg> for &'msg [u8] {
fn into_view<'shorter>(self) -> &'shorter [u8]
where
'msg: 'shorter,
{
self
}
}
impl<'msg> ViewProxy<'msg> for &'msg [u8] {}
#[derive(Debug, PartialEq)]
pub struct Utf8Error {
pub(crate) inner: std::str::Utf8Error,
}
impl std::fmt::Display for Utf8Error {
fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
self.inner.fmt(f)
}
}
impl std::error::Error for Utf8Error {}
impl From<std::str::Utf8Error> for Utf8Error {
fn from(inner: std::str::Utf8Error) -> Utf8Error {
Utf8Error { inner }
}
}
pub struct ProtoString {
pub(crate) inner: InnerProtoString,
}
impl ProtoString {
pub fn as_view(&self) -> &ProtoStr {
unsafe { ProtoStr::from_utf8_unchecked(self.as_bytes()) }
}
pub fn as_bytes(&self) -> &[u8] {
self.inner.as_bytes()
}
#[doc(hidden)]
pub fn into_inner(self, _private: Private) -> InnerProtoString {
self.inner
}
#[doc(hidden)]
pub fn from_inner(_private: Private, inner: InnerProtoString) -> ProtoString {
Self { inner }
}
}
impl SealedInternal for ProtoString {}
impl AsRef<[u8]> for ProtoString {
fn as_ref(&self) -> &[u8] {
self.inner.as_bytes()
}
}
impl From<ProtoString> for ProtoBytes {
fn from(v: ProtoString) -> Self {
ProtoBytes { inner: v.inner }
}
}
impl From<&str> for ProtoString {
fn from(v: &str) -> Self {
Self::from(v.as_bytes())
}
}
impl From<&[u8]> for ProtoString {
fn from(v: &[u8]) -> Self {
Self { inner: InnerProtoString::from(v) }
}
}
impl SealedInternal for &str {}
impl SealedInternal for &ProtoStr {}
impl IntoProxied<ProtoString> for &str {
fn into_proxied(self, _private: Private) -> ProtoString {
ProtoString::from(self)
}
}
impl IntoProxied<ProtoString> for &ProtoStr {
fn into_proxied(self, _private: Private) -> ProtoString {
ProtoString::from(self.as_bytes())
}
}
impl IntoProxied<ProtoString> for String {
fn into_proxied(self, _private: Private) -> ProtoString {
ProtoString::from(self.as_str())
}
}
impl IntoProxied<ProtoString> for &String {
fn into_proxied(self, _private: Private) -> ProtoString {
ProtoString::from(self.as_bytes())
}
}
impl IntoProxied<ProtoString> for OsString {
fn into_proxied(self, private: Private) -> ProtoString {
self.as_os_str().into_proxied(private)
}
}
impl IntoProxied<ProtoString> for &OsStr {
fn into_proxied(self, _private: Private) -> ProtoString {
ProtoString::from(self.as_encoded_bytes())
}
}
impl IntoProxied<ProtoString> for Box<str> {
fn into_proxied(self, _private: Private) -> ProtoString {
ProtoString::from(AsRef::<str>::as_ref(&self))
}
}
impl IntoProxied<ProtoString> for Cow<'_, str> {
fn into_proxied(self, _private: Private) -> ProtoString {
ProtoString::from(AsRef::<str>::as_ref(&self))
}
}
impl IntoProxied<ProtoString> for Rc<str> {
fn into_proxied(self, _private: Private) -> ProtoString {
ProtoString::from(AsRef::<str>::as_ref(&self))
}
}
impl IntoProxied<ProtoString> for Arc<str> {
fn into_proxied(self, _private: Private) -> ProtoString {
ProtoString::from(AsRef::<str>::as_ref(&self))
}
}
#[repr(transparent)]
pub struct ProtoStr([u8]);
impl ProtoStr {
pub fn as_bytes(&self) -> &[u8] {
&self.0
}
pub fn to_str(&self) -> Result<&str, Utf8Error> {
Ok(std::str::from_utf8(&self.0)?)
}
pub fn to_cow_lossy(&self) -> Cow<'_, str> {
String::from_utf8_lossy(&self.0)
}
pub fn is_empty(&self) -> bool {
self.0.is_empty()
}
pub fn len(&self) -> usize {
self.0.len()
}
pub fn chars(&self) -> impl Iterator<Item = char> + '_ + fmt::Debug {
Utf8Chunks::new(self.as_bytes()).flat_map(|chunk| {
let mut yield_replacement_char = !chunk.invalid().is_empty();
chunk.valid().chars().chain(iter::from_fn(move || {
yield_replacement_char.then(|| {
yield_replacement_char = false;
char::REPLACEMENT_CHARACTER
})
}))
})
}
pub fn utf8_chunks(&self) -> impl Iterator<Item = Result<&str, &[u8]>> + '_ {
Utf8Chunks::new(self.as_bytes()).flat_map(|chunk| {
let valid = chunk.valid();
let invalid = chunk.invalid();
(!valid.is_empty())
.then_some(Ok(valid))
.into_iter()
.chain((!invalid.is_empty()).then_some(Err(invalid)))
})
}
pub unsafe fn from_utf8_unchecked(bytes: &[u8]) -> &Self {
unsafe { &*(bytes as *const [u8] as *const Self) }
}
pub fn from_str(string: &str) -> &Self {
unsafe { Self::from_utf8_unchecked(string.as_bytes()) }
}
}
impl AsRef<[u8]> for ProtoStr {
fn as_ref(&self) -> &[u8] {
self.as_bytes()
}
}
impl<'msg> From<&'msg ProtoStr> for &'msg [u8] {
fn from(val: &'msg ProtoStr) -> &'msg [u8] {
val.as_bytes()
}
}
impl<'msg> From<&'msg str> for &'msg ProtoStr {
fn from(val: &'msg str) -> &'msg ProtoStr {
ProtoStr::from_str(val)
}
}
impl<'msg> TryFrom<&'msg ProtoStr> for &'msg str {
type Error = Utf8Error;
fn try_from(val: &'msg ProtoStr) -> Result<&'msg str, Utf8Error> {
val.to_str()
}
}
impl<'msg> TryFrom<&'msg [u8]> for &'msg ProtoStr {
type Error = Utf8Error;
fn try_from(val: &'msg [u8]) -> Result<&'msg ProtoStr, Utf8Error> {
Ok(ProtoStr::from_str(std::str::from_utf8(val)?))
}
}
impl fmt::Debug for ProtoStr {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
fmt::Debug::fmt(&Utf8Chunks::new(self.as_bytes()).debug(), f)
}
}
impl fmt::Display for ProtoStr {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
use std::fmt::Write as _;
for chunk in Utf8Chunks::new(self.as_bytes()) {
fmt::Display::fmt(chunk.valid(), f)?;
if !chunk.invalid().is_empty() {
f.write_char(char::REPLACEMENT_CHARACTER)?;
}
}
Ok(())
}
}
impl Hash for ProtoStr {
fn hash<H: Hasher>(&self, state: &mut H) {
self.as_bytes().hash(state)
}
}
impl Eq for ProtoStr {}
impl Ord for ProtoStr {
fn cmp(&self, other: &ProtoStr) -> Ordering {
self.as_bytes().cmp(other.as_bytes())
}
}
impl Proxied for ProtoString {
type View<'msg> = &'msg ProtoStr;
}
impl AsView for ProtoString {
type Proxied = Self;
fn as_view(&self) -> &ProtoStr {
self.as_view()
}
}
impl<'msg> Proxy<'msg> for &'msg ProtoStr {}
impl AsView for &ProtoStr {
type Proxied = ProtoString;
fn as_view(&self) -> &ProtoStr {
self
}
}
impl<'msg> IntoView<'msg> for &'msg ProtoStr {
fn into_view<'shorter>(self) -> &'shorter ProtoStr
where
'msg: 'shorter,
{
self
}
}
impl<'msg> ViewProxy<'msg> for &'msg ProtoStr {}
macro_rules! impl_bytes_partial_cmp {
($(<($($generics:tt)*)> $lhs:ty => $rhs:ty),+ $(,)?) => {
$(
impl<$($generics)*> PartialEq<$rhs> for $lhs {
fn eq(&self, other: &$rhs) -> bool {
AsRef::<[u8]>::as_ref(self) == AsRef::<[u8]>::as_ref(other)
}
}
impl<$($generics)*> PartialOrd<$rhs> for $lhs {
fn partial_cmp(&self, other: &$rhs) -> Option<Ordering> {
AsRef::<[u8]>::as_ref(self).partial_cmp(AsRef::<[u8]>::as_ref(other))
}
}
)*
};
}
impl_bytes_partial_cmp!(
<()> ProtoStr => ProtoStr,
<()> ProtoStr => str,
<()> str => ProtoStr,
);
impl std::fmt::Debug for ProtoString {
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> Result<(), std::fmt::Error> {
std::fmt::Debug::fmt(self.as_view(), f)
}
}
impl std::fmt::Debug for ProtoBytes {
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> Result<(), std::fmt::Error> {
std::fmt::Debug::fmt(self.as_view(), f)
}
}
unsafe impl Sync for ProtoString {}
unsafe impl Send for ProtoString {}
unsafe impl Send for ProtoBytes {}
unsafe impl Sync for ProtoBytes {}
#[cfg(test)]
mod tests {
use super::*;
use googletest::prelude::*;
fn test_proto_str(bytes: &[u8]) -> &ProtoStr {
unsafe { ProtoStr::from_utf8_unchecked(bytes) }
}
#[gtest]
fn proto_str_debug() {
assert_eq!(&format!("{:?}", test_proto_str(b"Hello There")), "\"Hello There\"");
assert_eq!(
&format!(
"{:?}",
test_proto_str(b"Hello\xC0\x80 There\xE6\x83 Goodbye\xf4\x8d\x93\xaa"),
),
"\"Hello\\xC0\\x80 There\\xE6\\x83 Goodbye\\u{10d4ea}\"",
);
}
#[gtest]
fn proto_str_display() {
assert_eq!(&test_proto_str(b"Hello There").to_string(), "Hello There");
assert_eq!(
&test_proto_str(b"Hello\xC0\x80 There\xE6\x83 Goodbye\xf4\x8d\x93\xaa").to_string(),
"Hello�� There� Goodbye\u{10d4ea}",
);
}
#[gtest]
fn proto_str_to_rust_str() {
assert_eq!(test_proto_str(b"hello").to_str(), Ok("hello"));
assert_eq!(test_proto_str("ศไทย中华Việt Nam".as_bytes()).to_str(), Ok("ศไทย中华Việt Nam"));
for expect_fail in [
&b"Hello\xC2 There\xFF Goodbye"[..],
b"Hello\xC0\x80 There\xE6\x83 Goodbye",
b"\xF5foo\xF5\x80bar",
b"\xF1foo\xF1\x80bar\xF1\x80\x80baz",
b"\xF4foo\xF4\x80bar\xF4\xBFbaz",
b"\xF0\x80\x80\x80foo\xF0\x90\x80\x80bar",
b"\xED\xA0\x80foo\xED\xBF\xBFbar",
] {
assert!(
matches!(test_proto_str(expect_fail).to_str(), Err(Utf8Error { inner: _ })),
"{expect_fail:?}"
);
}
}
#[gtest]
fn proto_str_to_cow() {
assert_eq!(test_proto_str(b"hello").to_cow_lossy(), Cow::Borrowed("hello"));
assert_eq!(
test_proto_str("ศไทย中华Việt Nam".as_bytes()).to_cow_lossy(),
Cow::Borrowed("ศไทย中华Việt Nam")
);
for (bytes, lossy_str) in [
(&b"Hello\xC2 There\xFF Goodbye"[..], "Hello� There� Goodbye"),
(b"Hello\xC0\x80 There\xE6\x83 Goodbye", "Hello�� There� Goodbye"),
(b"\xF5foo\xF5\x80bar", "�foo��bar"),
(b"\xF1foo\xF1\x80bar\xF1\x80\x80baz", "�foo�bar�baz"),
(b"\xF4foo\xF4\x80bar\xF4\xBFbaz", "�foo�bar��baz"),
(b"\xF0\x80\x80\x80foo\xF0\x90\x80\x80bar", "����foo\u{10000}bar"),
(b"\xED\xA0\x80foo\xED\xBF\xBFbar", "���foo���bar"),
] {
let cow = test_proto_str(bytes).to_cow_lossy();
assert!(matches!(cow, Cow::Owned(_)));
assert_eq!(&*cow, lossy_str, "{bytes:?}");
}
}
#[gtest]
fn proto_str_utf8_chunks() {
macro_rules! assert_chunks {
($bytes:expr, $($chunks:expr),* $(,)?) => {
let bytes = $bytes;
let chunks: &[std::result::Result<&str, &[u8]>] = &[$($chunks),*];
let s = test_proto_str(bytes);
let mut got_chunks = s.utf8_chunks();
let mut expected_chars = chunks.iter().copied();
assert!(got_chunks.eq(expected_chars), "{bytes:?} -> {chunks:?}");
};
}
assert_chunks!(b"hello", Ok("hello"));
assert_chunks!("ศไทย中华Việt Nam".as_bytes(), Ok("ศไทย中华Việt Nam"));
assert_chunks!(
b"Hello\xC2 There\xFF Goodbye",
Ok("Hello"),
Err(b"\xC2"),
Ok(" There"),
Err(b"\xFF"),
Ok(" Goodbye"),
);
assert_chunks!(
b"Hello\xC0\x80 There\xE6\x83 Goodbye",
Ok("Hello"),
Err(b"\xC0"),
Err(b"\x80"),
Ok(" There"),
Err(b"\xE6\x83"),
Ok(" Goodbye"),
);
assert_chunks!(
b"\xF5foo\xF5\x80bar",
Err(b"\xF5"),
Ok("foo"),
Err(b"\xF5"),
Err(b"\x80"),
Ok("bar"),
);
assert_chunks!(
b"\xF1foo\xF1\x80bar\xF1\x80\x80baz",
Err(b"\xF1"),
Ok("foo"),
Err(b"\xF1\x80"),
Ok("bar"),
Err(b"\xF1\x80\x80"),
Ok("baz"),
);
assert_chunks!(
b"\xF4foo\xF4\x80bar\xF4\xBFbaz",
Err(b"\xF4"),
Ok("foo"),
Err(b"\xF4\x80"),
Ok("bar"),
Err(b"\xF4"),
Err(b"\xBF"),
Ok("baz"),
);
assert_chunks!(
b"\xF0\x80\x80\x80foo\xF0\x90\x80\x80bar",
Err(b"\xF0"),
Err(b"\x80"),
Err(b"\x80"),
Err(b"\x80"),
Ok("foo\u{10000}bar"),
);
assert_chunks!(
b"\xED\xA0\x80foo\xED\xBF\xBFbar",
Err(b"\xED"),
Err(b"\xA0"),
Err(b"\x80"),
Ok("foo"),
Err(b"\xED"),
Err(b"\xBF"),
Err(b"\xBF"),
Ok("bar"),
);
}
#[gtest]
fn proto_str_chars() {
macro_rules! assert_chars {
($bytes:expr, $chars:expr) => {
let bytes = $bytes;
let chars = $chars;
let s = test_proto_str(bytes);
let mut got_chars = s.chars();
let mut expected_chars = chars.into_iter();
assert!(got_chars.eq(expected_chars), "{bytes:?} -> {chars:?}");
};
}
assert_chars!(b"hello", ['h', 'e', 'l', 'l', 'o']);
assert_chars!(
"ศไทย中华Việt Nam".as_bytes(),
['ศ', 'ไ', 'ท', 'ย', '中', '华', 'V', 'i', 'ệ', 't', ' ', 'N', 'a', 'm']
);
assert_chars!(
b"Hello\xC2 There\xFF Goodbye",
[
'H', 'e', 'l', 'l', 'o', '�', ' ', 'T', 'h', 'e', 'r', 'e', '�', ' ', 'G', 'o',
'o', 'd', 'b', 'y', 'e'
]
);
assert_chars!(
b"Hello\xC0\x80 There\xE6\x83 Goodbye",
[
'H', 'e', 'l', 'l', 'o', '�', '�', ' ', 'T', 'h', 'e', 'r', 'e', '�', ' ', 'G',
'o', 'o', 'd', 'b', 'y', 'e'
]
);
assert_chars!(b"\xF5foo\xF5\x80bar", ['�', 'f', 'o', 'o', '�', '�', 'b', 'a', 'r']);
assert_chars!(
b"\xF1foo\xF1\x80bar\xF1\x80\x80baz",
['�', 'f', 'o', 'o', '�', 'b', 'a', 'r', '�', 'b', 'a', 'z']
);
assert_chars!(
b"\xF4foo\xF4\x80bar\xF4\xBFbaz",
['�', 'f', 'o', 'o', '�', 'b', 'a', 'r', '�', '�', 'b', 'a', 'z']
);
assert_chars!(
b"\xF0\x80\x80\x80foo\xF0\x90\x80\x80bar",
['�', '�', '�', '�', 'f', 'o', 'o', '\u{10000}', 'b', 'a', 'r']
);
assert_chars!(
b"\xED\xA0\x80foo\xED\xBF\xBFbar",
['�', '�', '�', 'f', 'o', 'o', '�', '�', '�', 'b', 'a', 'r']
);
}
}