use crate::error::{self, ExpectedKind, Received, is_eof_io_error, io_syntax_error}; use num::bigint::BigInt; use num::traits::cast::{FromPrimitive, ToPrimitive}; use std::borrow::Cow; use std::convert::TryFrom; use std::convert::TryInto; use std::io; use std::marker::PhantomData; use super::constants::Tag; use super::super::{ CompoundClass, DomainDecode, Embeddable, Map, NestedValue, Record, Set, Value, reader::{ Token, BinarySource, Reader, ReaderResult, }, repr::Annotations, signed_integer::SignedInteger, }; pub struct PackedReader<'de, 'src, D: Embeddable, N: NestedValue, Dec: DomainDecode, S: BinarySource<'de>> { pub source: &'src mut S, pub decode_embedded: Dec, phantom: PhantomData<&'de (D, N)>, } impl<'de, 'src, D: Embeddable, N: NestedValue, Dec: DomainDecode, S: BinarySource<'de>> BinarySource<'de> for PackedReader<'de, 'src, D, N, Dec, S> { type Mark = S::Mark; fn mark(&mut self) -> io::Result { self.source.mark() } fn restore(&mut self, mark: &Self::Mark) -> io::Result<()> { self.source.restore(mark) } fn skip(&mut self) -> io::Result<()> { self.source.skip() } fn peek(&mut self) -> io::Result { self.source.peek() } fn readbytes(&mut self, count: usize) -> io::Result> { self.source.readbytes(count) } fn readbytes_into(&mut self, bs: &mut [u8]) -> io::Result<()> { self.source.readbytes_into(bs) } } fn out_of_range>(i: I) -> error::Error { error::Error::NumberOutOfRange(i.into()) } impl<'de, 'src, D: Embeddable, N: NestedValue, Dec: DomainDecode, S: BinarySource<'de>> PackedReader<'de, 'src, D, N, Dec, S> { pub fn new(source: &'src mut S, decode_embedded: Dec) -> Self { PackedReader { source, decode_embedded, phantom: PhantomData } } fn read(&mut self) -> io::Result { let v = self.peek()?; self.skip()?; Ok(v) } fn expected(&mut self, k: ExpectedKind) -> error::Error { match self.demand_next(true) { Ok(v) => error::Error::Expected(k, Received::ReceivedOtherValue(format!("{:?}", v))), Err(e) => e.into() } } fn varint(&mut self) -> io::Result { let mut shift = 0; let mut acc: usize = 0; loop { let v = self.read()?; acc |= ((v & 0x7f) as usize) << shift; shift += 7; if v & 0x80 == 0 { return Ok(acc) } } } fn peekend(&mut self) -> io::Result { if self.peek()? == Tag::End.into() { self.skip()?; Ok(true) } else { Ok(false) } } fn peek_next_nonannotation_tag(&mut self) -> ReaderResult { loop { match Tag::try_from(self.peek()?)? { Tag::Annotation => { self.skip()?; self.skip_value()?; }, other => return Ok(other), } } } fn next_atomic(&mut self, expected_tag: Tag, k: ExpectedKind) -> ReaderResult> { let actual_tag = self.peek_next_nonannotation_tag()?; if actual_tag == expected_tag { self.skip()?; let count = self.varint()?; Ok(self.readbytes(count)?) } else { Err(self.expected(k)) } } fn next_compound(&mut self, expected_tag: Tag, k: ExpectedKind) -> ReaderResult<()> { let actual_tag = self.peek_next_nonannotation_tag()?; if actual_tag == expected_tag { self.skip()?; Ok(()) } else { Err(self.expected(k)) } } fn read_signed_integer(&mut self, count: usize) -> io::Result { if count == 0 { return Ok(SignedInteger::from(0_i128)); } if count > 16 { let bs = self.readbytes(count)?; if (bs[0] & 0x80) == 0 { // Positive or zero. let mut i = 0; while i < count && bs[i] == 0 { i += 1; } if count - i <= 16 { Ok(SignedInteger::from(u128::from_be_bytes(bs[bs.len() - 16..].try_into().unwrap()))) } else { Ok(SignedInteger::from(Cow::Owned(BigInt::from_bytes_be(num::bigint::Sign::Plus, &bs[i..])))) } } else { // Negative. let mut i = 0; while i < count && bs[i] == 0xff { i += 1; } if count - i <= 16 { Ok(SignedInteger::from(i128::from_be_bytes(bs[bs.len() - 16..].try_into().unwrap()))) } else { Ok(SignedInteger::from(Cow::Owned(BigInt::from_signed_bytes_be(&bs)))) } } } else { let first_byte = self.read()?; let prefix_byte = if (first_byte & 0x80) == 0 { 0x00 } else { 0xff }; let mut bs = [prefix_byte; 16]; bs[16 - count] = first_byte; self.readbytes_into(&mut bs[16 - (count - 1)..])?; Ok(SignedInteger::from(i128::from_be_bytes(bs))) } } fn next_unsigned(&mut self, f: F) -> ReaderResult where F: FnOnce(u128) -> Option { let tag = self.peek_next_nonannotation_tag()?; match tag { Tag::SmallInteger(v) => { self.skip()?; if v < 0 { Err(out_of_range(v)) } else { f(v as u128).ok_or_else(|| out_of_range(v)) } } Tag::MediumInteger(count) => { self.skip()?; let n = &self.read_signed_integer(count.into())?; let i = n.try_into().map_err(|_| out_of_range(n))?; f(i).ok_or_else(|| out_of_range(i)) } Tag::SignedInteger => { self.skip()?; let count = self.varint()?; let n = &self.read_signed_integer(count)?; let i = n.try_into().map_err(|_| out_of_range(n))?; f(i).ok_or_else(|| out_of_range(i)) } _ => Err(self.expected(ExpectedKind::SignedInteger)) } } fn next_signed(&mut self, f: F) -> ReaderResult where F: FnOnce(i128) -> Option { let tag = self.peek_next_nonannotation_tag()?; match tag { Tag::SmallInteger(v) => { self.skip()?; f(v.into()).ok_or_else(|| out_of_range(v)) } Tag::MediumInteger(count) => { self.skip()?; let n = &self.read_signed_integer(count.into())?; let i = n.try_into().map_err(|_| out_of_range(n))?; f(i).ok_or_else(|| out_of_range(i)) } Tag::SignedInteger => { self.skip()?; let count = self.varint()?; let n = &self.read_signed_integer(count)?; let i = n.try_into().map_err(|_| out_of_range(n))?; f(i).ok_or_else(|| out_of_range(i)) } _ => Err(self.expected(ExpectedKind::SignedInteger)) } } fn gather_annotations(&mut self) -> io::Result> { let mut annotations = vec![self.demand_next(true)?]; while Tag::try_from(self.peek()?)? == Tag::Annotation { self.skip()?; annotations.push(self.demand_next(true)?); } Ok(annotations) } fn skip_annotations(&mut self) -> io::Result<()> { self.skip_value()?; while Tag::try_from(self.peek()?)? == Tag::Annotation { self.skip()?; self.skip_value()?; } Ok(()) } fn next_upto_end(&mut self, read_annotations: bool) -> io::Result> { match self.peekend()? { true => Ok(None), false => Ok(Some(self.demand_next(read_annotations)?)), } } } impl<'de, 'src, D: Embeddable, N: NestedValue, Dec: DomainDecode, S: BinarySource<'de>> Reader<'de, D, N> for PackedReader<'de, 'src, D, N, Dec, S> { fn next(&mut self, read_annotations: bool) -> io::Result> { match self.peek() { Err(e) if is_eof_io_error(&e) => return Ok(None), Err(e) => return Err(e), Ok(_) => (), } Ok(Some(match Tag::try_from(self.read()?)? { Tag::False => N::new(false), Tag::True => N::new(true), Tag::Float => { let mut bs = [0; 4]; self.readbytes_into(&mut bs)?; Value::from(f32::from_bits(u32::from_be_bytes(bs))).wrap() } Tag::Double => { let mut bs = [0; 8]; self.readbytes_into(&mut bs)?; Value::from(f64::from_bits(u64::from_be_bytes(bs))).wrap() } Tag::Annotation => { if read_annotations { let mut annotations = self.gather_annotations()?; let (existing_annotations, v) = self.demand_next(read_annotations)?.pieces(); annotations.extend_from_slice(existing_annotations.slice()); N::wrap(Annotations::new(Some(annotations)), v) } else { self.skip_annotations()?; self.demand_next(read_annotations)? } } Tag::Embedded => { Value::Embedded(self.decode_embedded.decode_embedded(self.source, read_annotations)?).wrap() } Tag::SmallInteger(v) => { // TODO: prebuild these in value.rs Value::from(v).wrap() } Tag::MediumInteger(count) => { let n = self.read_signed_integer(count.into())?; Value::SignedInteger(n).wrap() } Tag::SignedInteger => { let count = self.varint()?; let n = self.read_signed_integer(count)?; Value::SignedInteger(n).wrap() } Tag::String => { let count = self.varint()?; Value::String(decodestr(self.readbytes(count)?)?.into_owned()).wrap() } Tag::ByteString => { let count = self.varint()?; Value::ByteString(self.readbytes(count)?.into_owned()).wrap() } Tag::Symbol => { let count = self.varint()?; Value::Symbol(decodestr(self.readbytes(count)?)?.into_owned()).wrap() } Tag::Record => { let mut vs = Vec::new(); while let Some(v) = self.next_upto_end(read_annotations)? { vs.push(v); } if vs.is_empty() { return Err(io_syntax_error("Too few elements in encoded record")) } Value::Record(Record(vs)).wrap() } Tag::Sequence => { let mut vs = Vec::new(); while let Some(v) = self.next_upto_end(read_annotations)? { vs.push(v); } Value::Sequence(vs).wrap() } Tag::Set => { let mut s = Set::new(); while let Some(v) = self.next_upto_end(read_annotations)? { s.insert(v); } Value::Set(s).wrap() } Tag::Dictionary => { let mut d = Map::new(); while let Some(k) = self.next_upto_end(read_annotations)? { match self.next_upto_end(read_annotations)? { Some(v) => { d.insert(k, v); } None => return Err(io_syntax_error("Missing dictionary value")), } } Value::Dictionary(d).wrap() } tag @ Tag::End => { return Err(io_syntax_error(&format!("Invalid tag: {:?}", tag))); } })) } fn open_record(&mut self, arity: Option) -> ReaderResult<()> { self.next_compound(Tag::Record, ExpectedKind::Record(arity))?; self.ensure_more_expected() } fn open_sequence_or_set(&mut self) -> ReaderResult<()> { match self.peek_next_nonannotation_tag()? { Tag::Sequence | Tag::Set => { self.skip()?; Ok(()) } _ => Err(self.expected(ExpectedKind::SequenceOrSet)), } } fn open_sequence(&mut self) -> ReaderResult<()> { self.next_compound(Tag::Sequence, ExpectedKind::Sequence) } fn open_set(&mut self) -> ReaderResult<()> { self.next_compound(Tag::Set, ExpectedKind::Set) } fn open_dictionary(&mut self) -> ReaderResult<()> { self.next_compound(Tag::Dictionary, ExpectedKind::Dictionary) } fn close_compound(&mut self) -> ReaderResult { Ok(self.peekend()?) } fn open_embedded(&mut self) -> ReaderResult<()> { self.next_compound(Tag::Embedded, ExpectedKind::Embedded) } fn close_embedded(&mut self) -> ReaderResult<()> { Ok(()) } type Mark = S::Mark; fn mark(&mut self) -> io::Result { self.source.mark() } fn restore(&mut self, mark: &Self::Mark) -> io::Result<()> { self.source.restore(mark) } fn next_token(&mut self, read_embedded_annotations: bool) -> io::Result> { loop { return Ok(match Tag::try_from(self.peek()?)? { Tag::Embedded => { self.skip()?; Token::Embedded(self.decode_embedded.decode_embedded( self.source, read_embedded_annotations)?) } Tag::False | Tag::True | Tag::Float | Tag::Double | Tag::SmallInteger(_) | Tag::MediumInteger(_) | Tag::SignedInteger | Tag::String | Tag::ByteString | Tag::Symbol => Token::Atom(self.demand_next(false)?), Tag::Record => { self.skip()?; Token::Compound(CompoundClass::Record) } Tag::Sequence => { self.skip()?; Token::Compound(CompoundClass::Sequence) } Tag::Set => { self.skip()?; Token::Compound(CompoundClass::Set) } Tag::Dictionary => { self.skip()?; Token::Compound(CompoundClass::Dictionary) } Tag::End => { self.skip()?; Token::End } Tag::Annotation => { self.skip()?; self.skip_annotations()?; continue } }) } } fn next_annotations_and_token(&mut self) -> io::Result<(Vec, Token)> { match Tag::try_from(self.peek()?)? { Tag::Annotation => { self.skip()?; let annotations = self.gather_annotations()?; Ok((annotations, self.next_token(true)?)) } _ => Ok((Vec::new(), self.next_token(true)?)), } } fn next_boolean(&mut self) -> ReaderResult { match self.peek_next_nonannotation_tag()? { Tag::False => { self.skip()?; Ok(false) } Tag::True => { self.skip()?; Ok(true) } _ => Err(self.expected(ExpectedKind::Boolean)), } } fn next_signedinteger(&mut self) -> ReaderResult { let tag = self.peek_next_nonannotation_tag()?; match tag { Tag::SmallInteger(v) => { self.skip()?; Ok(SignedInteger::from(v as i32)) } Tag::MediumInteger(count) => { self.skip()?; Ok(self.read_signed_integer(count.into())?) } Tag::SignedInteger => { self.skip()?; let count = self.varint()?; Ok(self.read_signed_integer(count)?) } _ => Err(self.expected(ExpectedKind::SignedInteger)) } } fn next_i8(&mut self) -> ReaderResult { self.next_signed(|n| n.to_i8()) } fn next_i16(&mut self) -> ReaderResult { self.next_signed(|n| n.to_i16()) } fn next_i32(&mut self) -> ReaderResult { self.next_signed(|n| n.to_i32()) } fn next_i64(&mut self) -> ReaderResult { self.next_signed(|n| n.to_i64()) } fn next_i128(&mut self) -> ReaderResult { self.next_signed(|n| n.to_i128()) } fn next_u8(&mut self) -> ReaderResult { self.next_unsigned(|n| n.to_u8()) } fn next_u16(&mut self) -> ReaderResult { self.next_unsigned(|n| n.to_u16()) } fn next_u32(&mut self) -> ReaderResult { self.next_unsigned(|n| n.to_u32()) } fn next_u64(&mut self) -> ReaderResult { self.next_unsigned(|n| n.to_u64()) } fn next_u128(&mut self) -> ReaderResult { self.next_unsigned(|n| n.to_u128()) } fn next_f32(&mut self) -> ReaderResult { match self.peek_next_nonannotation_tag()? { Tag::Float => { self.skip()?; let mut bs = [0; 4]; self.readbytes_into(&mut bs)?; Ok(f32::from_bits(u32::from_be_bytes(bs))) }, Tag::Double => { self.skip()?; let mut bs = [0; 8]; self.readbytes_into(&mut bs)?; Ok(f64::from_bits(u64::from_be_bytes(bs)) as f32) }, _ => Err(self.expected(ExpectedKind::Float)), } } fn next_f64(&mut self) -> ReaderResult { match self.peek_next_nonannotation_tag()? { Tag::Float => { self.skip()?; let mut bs = [0; 4]; self.readbytes_into(&mut bs)?; Ok(f32::from_bits(u32::from_be_bytes(bs)) as f64) }, Tag::Double => { self.skip()?; let mut bs = [0; 8]; self.readbytes_into(&mut bs)?; Ok(f64::from_bits(u64::from_be_bytes(bs))) }, _ => Err(self.expected(ExpectedKind::Double)), } } fn next_str(&mut self) -> ReaderResult> { Ok(decodestr(self.next_atomic(Tag::String, ExpectedKind::Symbol)?)?) } fn next_bytestring(&mut self) -> ReaderResult> { self.next_atomic(Tag::ByteString, ExpectedKind::Symbol) } fn next_symbol(&mut self) -> ReaderResult> { Ok(decodestr(self.next_atomic(Tag::Symbol, ExpectedKind::Symbol)?)?) } } fn decodestr(cow: Cow<'_, [u8]>) -> io::Result> { match cow { Cow::Borrowed(bs) => Ok(Cow::Borrowed(std::str::from_utf8(bs).map_err(|_| io_syntax_error("Invalid UTF-8"))?)), Cow::Owned(bs) => Ok(Cow::Owned(String::from_utf8(bs).map_err(|_| io_syntax_error("Invalid UTF-8"))?)), } }