use std::{borrow::Cow, ffi::CStr, mem::size_of};
use encoding_rs::SHIFT_JIS;
use itertools::Itertools;
use zerocopy::{FromBytes, FromZeros, Immutable, IntoBytes, KnownLayout, big_endian::*};
use crate::{
Error, Result,
util::{array_ref, static_assert},
};
/// Kind of an FST node, as decoded from the node's one-byte kind field.
#[derive(Clone, Debug, PartialEq)]
pub enum NodeKind {
/// A file entry (stored as kind byte `0`).
File,
/// A directory entry (stored as kind byte `1`).
Directory,
/// Any other kind byte. Written back as `u8::MAX` when encoded.
Invalid,
}
/// A single 12-byte FST node in its raw in-buffer layout.
///
/// Multi-byte fields are big-endian. Use the accessor methods rather than the raw fields,
/// since the stored offset of a file node is scaled when the FST belongs to a Wii disc.
#[derive(Copy, Clone, Debug, PartialEq, FromBytes, IntoBytes, Immutable, KnownLayout)]
#[repr(C, align(4))]
pub struct Node {
// Raw kind byte: 0 = file, 1 = directory, anything else is treated as invalid.
kind: u8,
// 24-bit big-endian offset of the node's name within the string table.
name_offset: [u8; 3],
// Raw stored offset. For file nodes with `is_wii` set, this is the real offset divided by 4.
// The builder in this file stores the parent node index here for directories.
offset: U32,
// For directories, the iterator and `find` in this file treat this as the index one past
// the directory's last entry. For files, presumably the file size in bytes.
length: U32,
}
// The raw view over a byte buffer relies on each node being exactly 12 bytes.
static_assert!(size_of::<Node>() == 12);
impl Node {
    /// Kind byte stored for file nodes.
    const RAW_FILE: u8 = 0;
    /// Kind byte stored for directory nodes.
    const RAW_DIRECTORY: u8 = 1;

    /// Maps a [`NodeKind`] to the byte stored in the node.
    #[inline]
    fn raw_kind(kind: &NodeKind) -> u8 {
        match kind {
            NodeKind::File => Self::RAW_FILE,
            NodeKind::Directory => Self::RAW_DIRECTORY,
            NodeKind::Invalid => u8::MAX,
        }
    }

    /// Packs the low 24 bits of `name_offset` into three big-endian bytes.
    #[inline]
    fn pack_name_offset(name_offset: u32) -> [u8; 3] {
        let be_bytes = name_offset.to_be_bytes();
        *array_ref![be_bytes, 1, 3]
    }

    /// Builds a node from its logical fields.
    ///
    /// Only the low 24 bits of `name_offset` are kept. When `is_wii` is set and `kind` is
    /// [`NodeKind::File`], `offset` is stored divided by 4; otherwise it is stored unchanged.
    /// In both cases the stored value is truncated to 32 bits.
    #[inline]
    pub fn new(kind: NodeKind, name_offset: u32, offset: u64, length: u32, is_wii: bool) -> Self {
        let scaled = is_wii && matches!(kind, NodeKind::File);
        let stored_offset = if scaled { (offset / 4) as u32 } else { offset as u32 };
        Self {
            kind: Self::raw_kind(&kind),
            name_offset: Self::pack_name_offset(name_offset),
            offset: U32::new(stored_offset),
            length: U32::new(length),
        }
    }

    /// Decodes the stored kind byte.
    #[inline]
    pub fn kind(&self) -> NodeKind {
        if self.is_file() {
            NodeKind::File
        } else if self.is_dir() {
            NodeKind::Directory
        } else {
            NodeKind::Invalid
        }
    }

    /// Overwrites the stored kind byte. The stored offset is left untouched.
    #[inline]
    pub fn set_kind(&mut self, kind: NodeKind) { self.kind = Self::raw_kind(&kind); }

    /// Returns `true` when the kind byte marks a file.
    #[inline]
    pub fn is_file(&self) -> bool { self.kind == Self::RAW_FILE }

    /// Returns `true` when the kind byte marks a directory.
    #[inline]
    pub fn is_dir(&self) -> bool { self.kind == Self::RAW_DIRECTORY }

    /// Offset of this node's name within the string table (24-bit value).
    #[inline]
    pub fn name_offset(&self) -> u32 {
        let [high, mid, low] = self.name_offset;
        (u32::from(high) << 16) | (u32::from(mid) << 8) | u32::from(low)
    }

    /// Stores the low 24 bits of `name_offset`.
    #[inline]
    pub fn set_name_offset(&mut self, name_offset: u32) {
        self.name_offset = Self::pack_name_offset(name_offset);
    }

    /// Returns the node's offset, multiplying the stored value by 4 for file nodes when
    /// `is_wii` is set.
    #[inline]
    pub fn offset(&self, is_wii: bool) -> u64 {
        let stored = u64::from(self.offset.get());
        if is_wii && self.is_file() { stored * 4 } else { stored }
    }

    /// Stores `offset`, dividing it by 4 first for file nodes when `is_wii` is set. The stored
    /// value is truncated to 32 bits.
    #[inline]
    pub fn set_offset(&mut self, offset: u64, is_wii: bool) {
        let logical = if is_wii && self.is_file() { offset / 4 } else { offset };
        self.offset = U32::new(logical as u32);
    }

    /// Returns the raw length field.
    #[inline]
    pub fn length(&self) -> u32 { self.length.get() }

    /// Overwrites the raw length field.
    #[inline]
    pub fn set_length(&mut self, length: u32) { self.length = U32::new(length); }
}
/// A borrowed, read-only view over an FST buffer, split into its node table and string table.
#[derive(Clone)]
pub struct Fst<'a> {
/// All nodes. `Fst::new` sizes this from the first node's length field, so index 0 is the
/// root node.
pub nodes: &'a [Node],
/// Null-terminated node names, addressed by `Node::name_offset` and decoded as Shift-JIS.
pub string_table: &'a [u8],
}
impl<'a> Fst<'a> {
    /// Creates a view over a raw FST buffer.
    ///
    /// The first node's length field is taken as the total node count; everything after the
    /// node table is the string table.
    ///
    /// # Errors
    ///
    /// Returns an error when `buf` is too small or misaligned for a node, or when the node
    /// count read from the first node does not fit inside `buf`.
    pub fn new(buf: &'a [u8]) -> Result<Self, &'static str> {
        let Ok((root_node, _)) = Node::ref_from_prefix(buf) else {
            return Err("FST root node not found");
        };
        // Computed in 64 bits: the node count comes from the buffer, and a 32-bit product
        // could wrap and slip past the bounds check below.
        let string_base = u64::from(root_node.length()) * size_of::<Node>() as u64;
        if string_base > buf.len() as u64 {
            return Err("FST string table out of bounds");
        }
        // Lossless: `string_base` was just shown to be no larger than `buf.len()`.
        let (node_buf, string_table) = buf.split_at(string_base as usize);
        let nodes =
            <[Node]>::ref_from_bytes(node_buf).map_err(|_| "FST node table is malformed")?;
        Ok(Self { nodes, string_table })
    }

    /// Iterates over every node after the root, yielding `(index, node, full path)`.
    #[inline]
    pub fn iter(&self) -> FstIter<'_> { FstIter { fst: self.clone(), idx: 1, segments: vec![] } }

    /// Returns the name of `node`, decoded from Shift-JIS.
    ///
    /// # Errors
    ///
    /// Returns a message when the node's name offset lies outside the string table or when
    /// no null terminator follows it.
    pub fn get_name(&self, node: Node) -> Result<Cow<'a, str>, String> {
        let name_buf = self.string_table.get(node.name_offset() as usize..).ok_or_else(|| {
            format!(
                "FST: name offset {} out of bounds (string table size: {})",
                node.name_offset(),
                self.string_table.len()
            )
        })?;
        let c_string = CStr::from_bytes_until_nul(name_buf).map_err(|_| {
            format!("FST: name at offset {} not null-terminated", node.name_offset())
        })?;
        let (decoded, _, _) = SHIFT_JIS.decode(c_string.to_bytes());
        Ok(decoded)
    }

    /// Looks up a file or directory by `/`-separated path.
    ///
    /// Leading, trailing and repeated slashes are ignored, and names are compared
    /// ASCII-case-insensitively. An empty path resolves to the root node (index 0).
    ///
    /// Returns `None` when no entry matches, when the path tries to descend through a file,
    /// or when the FST has no nodes at all.
    pub fn find(&self, path: &str) -> Option<(usize, Node)> {
        let mut split = path.trim_matches('/').split('/');
        let mut current = next_non_empty(&mut split);
        if current.is_empty() {
            // `nodes` is a public field and may be empty, so avoid indexing.
            return self.nodes.first().map(|root| (0, *root));
        }
        let mut idx = 1;
        let mut stop_at: Option<usize> = None;
        while let Some(node) = self.nodes.get(idx).copied() {
            if self.get_name(node).as_ref().is_ok_and(|name| name.eq_ignore_ascii_case(current)) {
                let next = next_non_empty(&mut split);
                if next.is_empty() {
                    return Some((idx, node));
                }
                if !node.is_dir() {
                    // More path components remain, but a file has no children.
                    return None;
                }
                // Descend. A directory's length is the absolute index one past its last
                // entry, so it is the search bound as-is.
                current = next;
                idx += 1;
                stop_at = Some(node.length() as usize);
            } else if node.is_dir() {
                // Skip the whole directory. Always move forward so that a malformed end
                // index cannot make the search loop forever.
                idx = (node.length() as usize).max(idx + 1);
            } else {
                idx += 1;
            }
            if stop_at.is_some_and(|stop| idx >= stop) {
                break;
            }
        }
        None
    }

    /// Counts the file nodes in the table.
    pub fn num_files(&self) -> usize { self.nodes.iter().filter(|n| n.is_file()).count() }
}
/// Iterator over the nodes of an [`Fst`] that also tracks each node's full path.
pub struct FstIter<'a> {
// The table being walked.
fst: Fst<'a>,
// Index of the next node to yield. `Fst::iter` starts this at 1, skipping the root.
idx: usize,
// Path segments of the most recently yielded node, each paired with the node index at
// which that segment stops applying.
segments: Vec<(Cow<'a, str>, usize)>,
}
impl Iterator for FstIter<'_> {
type Item = (usize, Node, String);
fn next(&mut self) -> Option<Self::Item> {
let idx = self.idx;
let node = self.fst.nodes.get(idx).copied()?;
let name = self.fst.get_name(node).unwrap_or("<invalid>".into());
self.idx += 1;
let mut new_size = 0;
for (_, end) in self.segments.iter() {
if *end == idx {
break;
}
new_size += 1;
}
self.segments.truncate(new_size);
let length = node.length() as u64;
let end = if node.is_dir() { length as usize } else { idx + 1 };
self.segments.push((name, end));
let path = self.segments.iter().map(|(name, _)| name.as_ref()).join("/");
Some((idx, node, path))
}
}
/// Advances `iter` past any empty strings and returns the first non-empty one, or `""` once
/// the iterator is exhausted.
#[inline]
fn next_non_empty<'a>(iter: &mut impl Iterator<Item = &'a str>) -> &'a str {
    iter.find(|segment| !segment.is_empty()).unwrap_or("")
}
/// Incrementally builds an FST from a sequence of file paths.
pub struct FstBuilder {
// Nodes created so far. Index 0 is the root directory added by the constructors.
nodes: Vec<Node>,
// Null-terminated, Shift-JIS-encoded names. Identical names are stored once and shared.
string_table: Vec<u8>,
// Directories that are still open, outermost first, as (name, node index) pairs. Their
// length fields are filled in when they are popped.
stack: Vec<(String, u32)>,
// Forwarded to `Node::new`, which uses it to decide how file offsets are stored.
is_wii: bool,
}
impl FstBuilder {
    /// Creates a builder containing only a root directory named `<root>`.
    pub fn new(is_wii: bool) -> Self {
        let mut builder = Self { nodes: vec![], string_table: vec![], stack: vec![], is_wii };
        builder.add_node(NodeKind::Directory, "<root>", 0, 0);
        builder
    }

    /// Creates a builder that starts from an existing string table, so names already present
    /// keep their offsets.
    ///
    /// The first string in the table is used as the root name, falling back to `<root>` when
    /// it is not valid UTF-8.
    ///
    /// # Errors
    ///
    /// Returns [`Error::DiscFormat`] when the table is non-empty and does not end in a null
    /// byte, or when it contains no null-terminated first string.
    pub fn new_with_string_table(is_wii: bool, string_table: Vec<u8>) -> Result<Self> {
        if matches!(string_table.last(), Some(n) if *n != 0) {
            return Err(Error::DiscFormat("String table must be null-terminated".to_string()));
        }
        let root_name = CStr::from_bytes_until_nul(&string_table)
            .map_err(|_| {
                Error::DiscFormat("String table root name not null-terminated".to_string())
            })?
            .to_str()
            .unwrap_or("<root>")
            .to_string();
        let mut builder = Self { nodes: vec![], string_table, stack: vec![], is_wii };
        builder.add_node(NodeKind::Directory, &root_name, 0, 0);
        Ok(builder)
    }

    /// Appends a file at `path` (components separated by `/`), creating directory nodes for
    /// any parent components that are not currently open.
    ///
    /// Files must be added grouped by directory: once a directory has been left it is closed,
    /// and a later path naming it again creates a second directory node.
    pub fn add_file(&mut self, path: &str, offset: u64, size: u32) {
        let components = path.split('/').collect::<Vec<_>>();
        // `split` always yields at least one item, so this cannot underflow.
        let dir_count = components.len() - 1;
        for i in 0..dir_count {
            if matches!(self.stack.get(i), Some((name, _)) if name != components[i]) {
                // The open directory at this depth is a different one: close it and
                // everything nested inside it.
                self.close_directories(i);
            }
            while i >= self.stack.len() {
                // Open a new directory node. Its offset field holds the parent's node index.
                let component_idx = self.stack.len();
                let parent = if component_idx == 0 { 0 } else { self.stack[component_idx - 1].1 };
                let node_idx =
                    self.add_node(NodeKind::Directory, components[component_idx], parent as u64, 0);
                self.stack.push((components[i].to_string(), node_idx));
            }
        }
        // Close directories deeper than this file's parent. Without this, adding `a/b/c`
        // followed by `a/d` would leave `b` open and its end index would later cover `d`.
        self.close_directories(dir_count);
        self.add_node(NodeKind::File, components[dir_count], offset, size);
    }

    /// Size in bytes that [`FstBuilder::finalize`] would currently produce.
    pub fn byte_size(&self) -> usize {
        size_of_val(self.nodes.as_slice()) + self.string_table.len()
    }

    /// Closes all open directories and serializes the node table followed by the string
    /// table.
    ///
    /// # Panics
    ///
    /// Panics if the output buffer cannot be allocated.
    pub fn finalize(mut self) -> Box<[u8]> {
        let node_count = self.nodes.len() as u32;
        self.close_directories(0);
        // The root's length field holds the total node count.
        self.nodes[0].set_length(node_count);
        let nodes_data = self.nodes.as_bytes();
        let string_table_data = self.string_table.as_bytes();
        let mut data =
            <[u8]>::new_box_zeroed_with_elems(nodes_data.len() + string_table_data.len()).unwrap();
        let (node_out, string_out) = data.split_at_mut(nodes_data.len());
        node_out.copy_from_slice(nodes_data);
        string_out.copy_from_slice(string_table_data);
        data
    }

    /// Pops open directories until at most `depth` remain, setting each popped directory's
    /// length to the current node count (the index one past its last entry).
    fn close_directories(&mut self, depth: usize) {
        let end = self.nodes.len() as u32;
        while self.stack.len() > depth {
            let Some((_, idx)) = self.stack.pop() else { break };
            self.nodes[idx as usize].set_length(end);
        }
    }

    /// Appends a node, reusing an existing string table entry when `name` (encoded as
    /// Shift-JIS) is already present, and returns the new node's index.
    fn add_node(&mut self, kind: NodeKind, name: &str, offset: u64, length: u32) -> u32 {
        let (bytes, _, _) = SHIFT_JIS.encode(name);
        // Walk the table one null-terminated string at a time, looking for an exact match.
        let mut name_offset = 0;
        while name_offset < self.string_table.len() {
            let string_buf = &self.string_table[name_offset..];
            // The table always ends in a null byte: the constructors reject any other table
            // and every append below adds a terminator.
            let existing = CStr::from_bytes_until_nul(string_buf).unwrap();
            if existing.to_bytes() == bytes.as_ref() {
                break;
            }
            name_offset += existing.to_bytes_with_nul().len();
        }
        // Not found: append the name at the end of the table.
        if name_offset == self.string_table.len() {
            self.string_table.extend_from_slice(bytes.as_ref());
            self.string_table.push(0);
        }
        let idx = self.nodes.len() as u32;
        self.nodes.push(Node::new(kind, name_offset as u32, offset, length, self.is_wii));
        idx
    }
}