use std::collections::BTreeSet;
use std::rc::Rc;
use crate::errors::{Error, Result};
use crate::property_info_parser::*;
use crate::trie_builder::*;
use crate::trie_node_arena::TrieNodeArena;
pub(crate) struct TrieSerializer {
arena: TrieNodeArena,
}
fn resolve_index<F>(name: Option<&str>, mut lookup: F) -> u32
where
F: FnMut(&str) -> Option<usize>,
{
match name {
Some(s) if !s.is_empty() => lookup(s)
.and_then(|i| u32::try_from(i).ok())
.unwrap_or(u32::MAX),
_ => u32::MAX,
}
}
impl TrieSerializer {
pub(crate) fn new(trie_builder: &TrieBuilder) -> Result<Self> {
let mut this = Self {
arena: TrieNodeArena::new(),
};
let header_offset = this.arena.allocate_object::<PropertyInfoAreaHeader>();
{
let header = this
.arena
.get_object::<PropertyInfoAreaHeader>(header_offset)?;
header.current_version = 1;
header.minimum_supported_version = 1;
}
this.arena
.get_object::<PropertyInfoAreaHeader>(header_offset)?
.contexts_offset = this.arena.size() as u32;
this.serialize_strings(&trie_builder.contexts)?;
this.arena
.get_object::<PropertyInfoAreaHeader>(header_offset)?
.types_offset = this.arena.size() as u32;
this.serialize_strings(&trie_builder.types)?;
this.arena
.get_object::<PropertyInfoAreaHeader>(header_offset)?
.size = this.arena.size() as u32;
let root_trie_offset = this.write_trie_node(&trie_builder.root)?;
this.arena
.get_object::<PropertyInfoAreaHeader>(header_offset)?
.root_offset = root_trie_offset;
let final_size = this.arena.size();
this.arena
.get_object::<PropertyInfoAreaHeader>(header_offset)?
.size = final_size as u32;
Ok(this)
}
fn write_property_entry(&mut self, property_entry: &PropertyEntryBuilder) -> Result<u32> {
let context_index =
resolve_index(property_entry.context.as_ref().map(|s| s.as_str()), |s| {
self.arena.info().find_context_index(s)
});
let type_index = resolve_index(property_entry.rtype.as_ref().map(|s| s.as_str()), |s| {
self.arena.info().find_type_index(s)
});
let entry_offset = self.arena.allocate_object::<PropertyEntry>();
let name_offset = self.arena.allocate_and_write_string(&property_entry.name) as u32;
let namelen = u32::try_from(property_entry.name.len()).map_err(|_| {
Error::FileValidation(format!(
"Property name too long: {} bytes",
property_entry.name.len()
))
})?;
let entry = self.arena.get_object::<PropertyEntry>(entry_offset)?;
entry.name_offset = name_offset;
entry.namelen = namelen;
entry.context_index = context_index;
entry.type_index = type_index;
Ok(entry_offset as u32)
}
fn write_trie_node(&mut self, builder_node: &TrieBuilderNode) -> Result<u32> {
let trie_offset = self.arena.allocate_object::<TrieNodeData>();
let property_entry = self.write_property_entry(&builder_node.property_entry)?;
self.arena
.get_object::<TrieNodeData>(trie_offset)?
.property_entry = property_entry;
let mut sorted_prefix_matches: Vec<_> = builder_node.prefixes.iter().collect();
sorted_prefix_matches.sort_by_key(|b| std::cmp::Reverse(b.name.len()));
self.arena
.get_object::<TrieNodeData>(trie_offset)?
.num_prefixes = sorted_prefix_matches.len() as u32;
let prefix_entries_array_offset = self
.arena
.allocate_uint32_array(sorted_prefix_matches.len());
self.arena
.get_object::<TrieNodeData>(trie_offset)?
.prefix_entries = prefix_entries_array_offset as u32;
let prefix_count = sorted_prefix_matches.len();
for (i, prefix_entry) in sorted_prefix_matches.iter().enumerate() {
let offset = self.write_property_entry(prefix_entry)?;
self.arena
.uint32_array(prefix_entries_array_offset, prefix_count)?[i] = offset;
}
let mut sorted_exact_matches: Vec<_> = builder_node.exact_matches.iter().collect();
sorted_exact_matches.sort_by(|a, b| a.name.cmp(&b.name));
self.arena
.get_object::<TrieNodeData>(trie_offset)?
.num_exact_matches = sorted_exact_matches.len() as u32;
let exact_match_entries_array_offset =
self.arena.allocate_uint32_array(sorted_exact_matches.len());
self.arena
.get_object::<TrieNodeData>(trie_offset)?
.exact_match_entries = exact_match_entries_array_offset as u32;
let exact_count = sorted_exact_matches.len();
for (i, exact_entry) in sorted_exact_matches.iter().enumerate() {
let offset = self.write_property_entry(exact_entry)?;
self.arena
.uint32_array(exact_match_entries_array_offset, exact_count)?[i] = offset;
}
let mut sorted_children: Vec<_> = builder_node.children.values().collect();
sorted_children.sort_by(|a, b| a.property_entry.name.cmp(&b.property_entry.name));
self.arena
.get_object::<TrieNodeData>(trie_offset)?
.num_child_nodes = sorted_children.len() as u32;
let children_offset_array_offset = self.arena.allocate_uint32_array(sorted_children.len());
self.arena
.get_object::<TrieNodeData>(trie_offset)?
.child_nodes = children_offset_array_offset as u32;
let children_count = sorted_children.len();
for (i, child_node) in sorted_children.iter().enumerate() {
let child_offset = self.write_trie_node(child_node)?;
self.arena
.uint32_array(children_offset_array_offset, children_count)?[i] = child_offset;
}
Ok(trie_offset as u32)
}
fn serialize_strings(&mut self, strings: &BTreeSet<Rc<String>>) -> Result<()> {
self.arena.allocate_and_write_uint32(strings.len() as u32);
let n = strings.len();
let offset_array_offset = self.arena.allocate_uint32_array(n);
for (i, string) in strings.iter().enumerate() {
let offset = self.arena.allocate_and_write_string(string);
self.arena.uint32_array(offset_array_offset, n)?[i] = offset as u32;
}
Ok(())
}
pub(crate) fn into_data(self) -> Vec<u8> {
self.arena.into_data()
}
}