use crate::SourceDataProvider;
use icu::collections::codepointinvlist::CodePointInversionListBuilder;
use icu::collections::codepointinvliststringlist::CodePointInversionListAndStringList;
use icu::properties::props::EmojiSet;
use icu::properties::provider::*;
use icu_provider::prelude::*;
use std::collections::HashSet;
use zerovec::VarZeroVec;
impl SourceDataProvider {
    /// Looks up the binary property stored in
    /// `uprops/<trie type>/<short_name>.toml` and returns its first
    /// `binary_property` entry.
    ///
    /// `name` is the expected long name and `short_name` the expected short
    /// name of the property; both are validated against the parsed data. When
    /// the data carries no short name, its long name is used as the short name
    /// for the comparison.
    ///
    /// # Errors
    ///
    /// * Any error produced by `icuexport()` or while reading/parsing the TOML
    ///   file is propagated unchanged.
    /// * `DataErrorKind::MarkerNotFound` if the file contains no
    ///   `binary_property` entry.
    /// * A custom "Property name mismatch" error (with `name` as context) if
    ///   the names in the file do not match the requested ones.
    fn get_binary_prop_for_unicodeset<'a>(
        &'a self,
        name: &str,
        short_name: &str,
    ) -> Result<&'a super::uprops_serde::binary::BinaryProperty, DataError> {
        let icuexport = self.icuexport()?;
        let toml_path = format!("uprops/{}/{}.toml", self.trie_type(), short_name);
        let parsed =
            icuexport.read_and_parse_toml::<super::uprops_serde::binary::Main>(&toml_path)?;

        let Some(property) = parsed.binary_property.first() else {
            return Err(DataErrorKind::MarkerNotFound.into_error());
        };

        // Data without an explicit short name falls back to its long name.
        let actual_short_name = property
            .short_name
            .as_ref()
            .unwrap_or(&property.long_name);

        let names_match = name == property.long_name && short_name == actual_short_name;
        if names_match {
            Ok(property)
        } else {
            Err(DataError::custom("Property name mismatch").with_display_context(name))
        }
    }
}
impl super::uprops_serde::binary::BinaryProperty {
fn build_uniset(&self) -> Result<CodePointInversionListAndStringList<'static>, DataError> {
let mut builder = CodePointInversionListBuilder::new();
for (start, end) in &self.ranges {
builder.add_range32(start..=end);
}
let inv_list = builder.build();
let strings = self.strings.as_ref().ok_or(DataError::custom(
"Error in deserializing strings from BinaryProperty source data",
))?;
let string_list = VarZeroVec::<str>::from(strings);
CodePointInversionListAndStringList::try_from(inv_list, string_list)
.map_err(|_| DataError::custom("Error in constructing CodePointInversionListAndStringList from deserialized BinaryProperty data"))
}
}
macro_rules! expand {
($(($prop:ty, $marker:ident)),+) => {
$(
impl DataProvider<$marker> for SourceDataProvider {
fn load(
&self,
req: DataRequest,
) -> Result<DataResponse<$marker>, DataError> {
self.check_req::<$marker>(req)?;
let data = self.get_binary_prop_for_unicodeset(
core::str::from_utf8(<$prop as EmojiSet>::NAME).unwrap(),
core::str::from_utf8(<$prop as EmojiSet>::SHORT_NAME).unwrap()
)?;
Ok(DataResponse {
metadata: Default::default(),
payload: DataPayload::from_owned(PropertyUnicodeSet::CPInversionListStrList(data.build_uniset()?)),
})
}
}
impl crate::IterableDataProviderCached<$marker> for SourceDataProvider {
fn iter_ids_cached(&self) -> Result<HashSet<DataIdentifierCow<'static>>, DataError> {
Ok(HashSet::from_iter([Default::default()]))
}
}
)+
};
}
expand!((
icu::properties::props::BasicEmoji,
PropertyBinaryBasicEmojiV1
));
/// Smoke test: loads `BasicEmoji` through the testing provider and probes a
/// handful of code points and strings.
#[test]
fn test_basic() {
    use icu::properties::{props::BasicEmoji, EmojiSetData};

    let provider = SourceDataProvider::new_testing();
    let emoji_data = EmojiSetData::try_new_unstable::<BasicEmoji>(&provider).unwrap();
    let emoji_set = emoji_data
        .as_code_point_inversion_list_string_list()
        .unwrap();

    // Plain whitespace / control characters are not in the set.
    assert!(!emoji_set.contains32(0x0020));
    assert!(!emoji_set.contains('\n'));

    // A single code point is found both as a `char` and as a one-character string.
    assert!(emoji_set.contains('🦃'));
    assert!(emoji_set.contains_str("\u{1F983}"));

    // A code point followed by U+FE0F is matched as a string.
    assert!(emoji_set.contains_str("\u{1F6E4}\u{FE0F}"));

    // The sequence U+0033 U+FE0F U+20E3 is expected to be absent.
    assert!(!emoji_set.contains_str("\u{0033}\u{FE0F}\u{20E3}"));
}