use proptest::prelude::*;
pub fn unicode_string() -> impl Strategy<Value = String> {
prop_oneof![
prop::collection::vec(
prop_oneof![
prop::char::range('a', 'z'),
prop::char::range('A', 'Z'),
prop::char::range('0', '9'),
Just(' '),
Just('\t'),
],
0..=50_usize,
)
.prop_map(|chars| chars.into_iter().collect()),
prop::collection::vec(prop::char::range('\u{00C0}', '\u{FFFF}'), 0..=50_usize)
.prop_map(|chars| chars.into_iter().collect()),
prop::collection::vec(prop::char::range('\u{10000}', '\u{10FFFF}'), 0..=30_usize)
.prop_map(|chars| chars.into_iter().collect()),
prop::collection::vec(
prop_oneof![
prop::char::range('a', 'z'),
prop::char::range('A', 'Z'),
prop::char::range('0', '9'),
prop::char::range('\u{00C0}', '\u{024F}'),
prop::char::range('\u{4E00}', '\u{9FFF}'),
prop::char::range('\u{10000}', '\u{10FFFF}'),
Just('\t'),
Just('\n'),
],
0..=100_usize,
)
.prop_map(|chars| chars.into_iter().collect()),
]
}
pub fn non_empty_unicode_string() -> impl Strategy<Value = String> {
unicode_string().prop_filter("string must be non-empty", |value| !value.is_empty())
}
#[cfg(test)]
mod tests {
use super::*;
proptest! {
#[test]
fn unicode_string_is_valid_utf8(s in unicode_string()) {
let bytes = s.as_bytes();
match std::str::from_utf8(bytes) {
Ok(roundtrip) => prop_assert_eq!(s.as_str(), roundtrip),
Err(err) => prop_assert!(false, "generated string was not valid UTF-8: {err}"),
}
}
#[test]
fn utf16_len_agrees_with_encode_utf16(s in unicode_string()) {
let encoded: Vec<u16> = s.encode_utf16().collect();
let from_utf16 = String::from_utf16_lossy(&encoded);
prop_assert_eq!(s, from_utf16);
}
#[test]
fn non_empty_unicode_string_never_empty(s in non_empty_unicode_string()) {
prop_assert!(!s.is_empty(), "non-empty strategy produced an empty string");
}
}
}