use core::fmt;
use crate::Decoder;
use crate::data::{Tag, Type};
use crate::decode::Error;
#[derive(Debug, Clone, Copy, PartialEq)]
pub enum Token<'b> {
Bool(bool),
U8(u8),
U16(u16),
U32(u32),
U64(u64),
I8(i8),
I16(i16),
I32(i32),
I64(i64),
F16(f32),
F32(f32),
F64(f64),
Bytes(&'b [u8]),
String(&'b str),
Array(u64),
Map(u64),
Tag(Tag),
Simple(u8),
Break,
Null,
Undefined,
BeginBytes,
BeginString,
BeginArray,
BeginMap
}
#[derive(Debug, Clone)]
pub struct Tokenizer<'b> {
decoder: Decoder<'b>
}
impl<'b> Iterator for Tokenizer<'b> {
type Item = Result<Token<'b>, Error>;
fn next(&mut self) -> Option<Self::Item> {
match self.token() {
Ok(t) => Some(Ok(t)),
Err(Error::EndOfInput) => None,
Err(e) => Some(Err(e))
}
}
}
impl<'b> From<Decoder<'b>> for Tokenizer<'b> {
fn from(d: Decoder<'b>) -> Self {
Tokenizer { decoder: d }
}
}
impl<'b> Tokenizer<'b> {
pub fn new(bytes: &'b[u8]) -> Self {
Tokenizer { decoder: Decoder::new(bytes) }
}
pub fn token(&mut self) -> Result<Token<'b>, Error> {
match self.decoder.datatype()? {
Type::Bool => self.decoder.bool().map(Token::Bool),
Type::U8 => self.decoder.u8().map(Token::U8),
Type::U16 => self.decoder.u16().map(Token::U16),
Type::U32 => self.decoder.u32().map(Token::U32),
Type::U64 => self.decoder.u64().map(Token::U64),
Type::I8 => self.decoder.i8().map(Token::I8),
Type::I16 => self.decoder.i16().map(Token::I16),
Type::I32 => self.decoder.i32().map(Token::I32),
Type::I64 => self.decoder.i64().map(Token::I64),
Type::F16 => self.decoder.f16().map(Token::F16),
Type::F32 => self.decoder.f32().map(Token::F32),
Type::F64 => self.decoder.f64().map(Token::F64),
Type::Bytes => self.decoder.bytes().map(Token::Bytes),
Type::String => self.decoder.str().map(Token::String),
Type::Tag => self.decoder.tag().map(Token::Tag),
Type::Simple => self.decoder.simple().map(Token::Simple),
Type::Array => self.decoder.array().map(|n| Token::Array(n.expect("array len"))),
Type::Map => self.decoder.map().map(|n| Token::Map(n.expect("map len"))),
Type::BytesIndef => { self.skip_byte(); Ok(Token::BeginBytes) }
Type::StringIndef => { self.skip_byte(); Ok(Token::BeginString) }
Type::ArrayIndef => { self.skip_byte(); Ok(Token::BeginArray) }
Type::MapIndef => { self.skip_byte(); Ok(Token::BeginMap) }
Type::Null => { self.skip_byte(); Ok(Token::Null) }
Type::Undefined => { self.skip_byte(); Ok(Token::Undefined) }
Type::Break => { self.skip_byte(); Ok(Token::Break) }
Type::Unknown(n) => Err(Error::TypeMismatch(n, "unknown cbor type"))
}
}
fn skip_byte(&mut self) {
self.decoder.set_position(self.decoder.position() + 1)
}
}
#[cfg(feature = "std")]
impl fmt::Display for Tokenizer<'_> {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
enum E {
N,
T,
A(Option<u64>),
M(Option<u64>),
B,
D,
S(&'static str),
X(&'static str)
}
let mut iter = Tokenizer::from(self.decoder.clone()).peekable();
let mut stack = Vec::new();
while iter.peek().is_some() {
stack.push(E::N);
while let Some(elt) = stack.pop() {
match elt {
E::N => match iter.next() {
Some(Ok(Token::Array(n))) => {
stack.push(E::A(Some(n)));
f.write_str("[")?
}
Some(Ok(Token::Map(n))) => {
stack.push(E::M(Some(n)));
f.write_str("{")?
}
Some(Ok(Token::BeginArray)) => {
stack.push(E::A(None));
f.write_str("[_ ")?
}
Some(Ok(Token::BeginMap)) => {
stack.push(E::M(None));
f.write_str("{_ ")?
}
Some(Ok(Token::BeginBytes)) => if let Some(Ok(Token::Break)) = iter.peek() {
iter.next();
f.write_str("''_")?
} else {
stack.push(E::B);
f.write_str("(_ ")?
}
Some(Ok(Token::BeginString)) => if let Some(Ok(Token::Break)) = iter.peek() {
iter.next();
f.write_str("\"\"_")?
} else {
stack.push(E::D);
f.write_str("(_ ")?
}
Some(Ok(Token::Tag(t))) => {
stack.push(E::T);
write!(f, "{}(", t.numeric())?
}
Some(Ok(t)) => t.fmt(f)?,
Some(Err(e)) => {
write!(f, " !!! decoding error: {}", e)?;
return Ok(())
}
None => continue
}
E::S(s) => f.write_str(s)?,
E::X(s) => match iter.peek() {
Some(Ok(Token::Break)) | None => continue,
Some(Ok(_)) => f.write_str(s)?,
Some(Err(e)) => {
write!(f, " !!! decoding error: {}", e)?;
return Ok(())
}
}
E::T => {
stack.push(E::S(")"));
stack.push(E::N)
}
E::A(Some(0)) => f.write_str("]")?,
E::A(Some(1)) => {
stack.push(E::A(Some(0)));
stack.push(E::N)
}
E::A(Some(n)) => {
stack.push(E::A(Some(n - 1)));
stack.push(E::S(", "));
stack.push(E::N)
}
E::A(None) => if let Some(Ok(Token::Break)) = iter.peek() {
iter.next();
f.write_str("]")?
} else {
stack.push(E::A(None));
stack.push(E::X(", "));
stack.push(E::N)
}
E::M(Some(0)) => f.write_str("}")?,
E::M(Some(1)) => {
stack.push(E::M(Some(0)));
stack.push(E::N);
stack.push(E::S(": "));
stack.push(E::N)
}
E::M(Some(n)) => {
stack.push(E::M(Some(n - 1)));
stack.push(E::S(", "));
stack.push(E::N);
stack.push(E::S(": "));
stack.push(E::N)
}
E::M(None) => if let Some(Ok(Token::Break)) = iter.peek() {
iter.next();
f.write_str("}")?
} else {
stack.push(E::M(None));
stack.push(E::X(", "));
stack.push(E::N);
stack.push(E::S(": "));
stack.push(E::N)
}
E::B => if let Some(Ok(Token::Break)) = iter.peek() {
iter.next();
f.write_str(")")?
} else {
stack.push(E::B);
stack.push(E::X(", "));
stack.push(E::N)
}
E::D => if let Some(Ok(Token::Break)) = iter.peek() {
iter.next();
f.write_str(")")?
} else {
stack.push(E::D);
stack.push(E::X(", "));
stack.push(E::N)
}
}
}
}
Ok(())
}
}
impl fmt::Display for Token<'_> {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
match self {
Token::Bool(b) => write!(f, "{}", b),
Token::U8(n) => write!(f, "{}", n),
Token::U16(n) => write!(f, "{}", n),
Token::U32(n) => write!(f, "{}", n),
Token::U64(n) => write!(f, "{}", n),
Token::I8(n) => write!(f, "{}", n),
Token::I16(n) => write!(f, "{}", n),
Token::I32(n) => write!(f, "{}", n),
Token::I64(n) => write!(f, "{}", n),
Token::F16(n) => write!(f, "{:e}", n),
Token::F32(n) => write!(f, "{:e}", n),
Token::F64(n) => write!(f, "{:e}", n),
Token::String(n) => write!(f, "\"{}\"", n),
Token::Array(n) => write!(f, "A[{}]", n),
Token::Map(n) => write!(f, "M[{}]", n),
Token::Tag(t) => write!(f, "T({})", t.numeric()),
Token::Simple(n) => write!(f, "simple({})", n),
Token::Break => f.write_str("]"),
Token::Null => f.write_str("null"),
Token::Undefined => f.write_str("undefined"),
Token::BeginBytes => f.write_str("?B["),
Token::BeginString => f.write_str("?S["),
Token::BeginArray => f.write_str("?A["),
Token::BeginMap => f.write_str("?M["),
Token::Bytes(b) => {
f.write_str("h'")?;
let mut i = b.len();
for x in *b {
if i > 1 {
write!(f, "{:02x} ", x)?
} else {
write!(f, "{:02x}", x)?
}
i -= 1;
}
f.write_str("'")
}
}
}
}