use super::symbol;
use crate::bit;
use crate::lz77;
use rle_decode_fast::rle_decode;
use std::cmp;
use std::io;
use std::io::Read;
/// Streaming DEFLATE decoder.
///
/// Wraps a reader `R` that supplies a DEFLATE bit stream and exposes the
/// decoded bytes through its own `Read` implementation.
#[derive(Debug)]
pub struct Decoder<R> {
// Bit-level reader wrapped around the underlying reader `R`.
bit_reader: bit::BitReader<R>,
// Decoded output. Back-references are resolved by copying from the tail of
// this vector, so already-delivered bytes are kept here as history.
buffer: Vec<u8>,
// Index into `buffer` of the next byte to hand out from `read`.
offset: usize,
// Set from the BFINAL bit of the most recently read block header; once it
// is set and `buffer` is drained, `read` reports end of stream.
eos: bool,
}
impl<R> Decoder<R>
where
    R: Read,
{
    /// Makes a new decoder that will read a DEFLATE stream from `inner`.
    pub fn new(inner: R) -> Self {
        let bit_reader = bit::BitReader::new(inner);
        Self {
            bit_reader,
            buffer: Vec::new(),
            offset: 0,
            eos: false,
        }
    }

    /// Returns an immutable reference to the underlying reader.
    pub fn as_inner_ref(&self) -> &R {
        self.bit_reader.as_inner_ref()
    }

    /// Returns a mutable reference to the underlying reader.
    pub fn as_inner_mut(&mut self) -> &mut R {
        self.bit_reader.as_inner_mut()
    }

    /// Consumes the decoder and returns the underlying reader.
    pub fn into_inner(self) -> R {
        self.bit_reader.into_inner()
    }

    /// Returns the decoder to its freshly constructed state: no buffered
    /// output, read position at zero, end-of-stream flag cleared, and the bit
    /// reader reset.
    pub(crate) fn reset(&mut self) {
        self.eos = false;
        self.offset = 0;
        self.buffer.clear();
        self.bit_reader.reset();
    }

    /// Reads one stored (BTYPE=00) block and appends its payload to `buffer`.
    ///
    /// # Errors
    ///
    /// * `InvalidData` if NLEN is not the one's complement of LEN.
    /// * `UnexpectedEof` if the inner reader ends before LEN payload bytes
    ///   were read.
    /// * Any I/O error reported by the inner reader.
    fn read_non_compressed_block(&mut self) -> io::Result<()> {
        // The rest of this block is read byte-wise straight from the inner
        // reader, so the bit reader is reset first (presumably discarding the
        // partially consumed byte -- confirm against `BitReader::reset`).
        self.bit_reader.reset();

        // LEN and NLEN are two consecutive little-endian 16-bit words.
        let mut word = [0; 2];
        self.bit_reader.as_inner_mut().read_exact(&mut word)?;
        let len = u16::from_le_bytes(word);
        self.bit_reader.as_inner_mut().read_exact(&mut word)?;
        let nlen = u16::from_le_bytes(word);
        if nlen != !len {
            return Err(invalid_data_error!(
                "LEN={} is not the one's complement of NLEN={}",
                len,
                nlen
            ));
        }

        // Copy at most LEN bytes; a shorter count means the input ended early.
        let mut payload = self.bit_reader.as_inner_mut().take(u64::from(len));
        let used = payload.read_to_end(&mut self.buffer)?;
        if used == usize::from(len) {
            Ok(())
        } else {
            Err(io::Error::new(
                io::ErrorKind::UnexpectedEof,
                format!(
                    "The reader has incorrect length: expected {}, read {}",
                    len, used
                ),
            ))
        }
    }

    /// Decodes one Huffman-coded block, appending its output to `buffer`.
    ///
    /// `huffman` builds the symbol decoder for the block from the bit stream.
    /// Symbols are then decoded until the end-of-block symbol is seen.
    ///
    /// # Errors
    ///
    /// * Any error from loading the codec or from the bit reader.
    /// * `InvalidData` if a back-reference points further back than the
    ///   number of bytes currently held in `buffer`.
    fn read_compressed_block<H>(&mut self, huffman: &H) -> io::Result<()>
    where
        H: symbol::HuffmanCodec,
    {
        let decoder = huffman.load(&mut self.bit_reader)?;
        loop {
            // The unchecked decode leaves any failure inside the bit reader,
            // so the error state is inspected before the symbol is used.
            let decoded = decoder.decode_unchecked(&mut self.bit_reader);
            self.bit_reader.check_last_error()?;
            match decoded {
                symbol::Symbol::EndOfBlock => return Ok(()),
                symbol::Symbol::Literal(byte) => self.buffer.push(byte),
                symbol::Symbol::Share { length, distance } => {
                    let available = self.buffer.len();
                    if available < usize::from(distance) {
                        return Err(invalid_data_error!(
                            "Too long backword reference: buffer.len={}, distance={}",
                            available,
                            distance
                        ));
                    }
                    rle_decode(&mut self.buffer, usize::from(distance), usize::from(length));
                }
            }
        }
    }

    /// Drops old history once `buffer` exceeds four times `lz77::MAX_DISTANCE`.
    ///
    /// Only the last `lz77::MAX_DISTANCE` bytes are kept, moved to the front,
    /// and `offset` is set to the new length so every retained byte counts as
    /// already delivered.
    fn truncate_old_buffer(&mut self) {
        let window = lz77::MAX_DISTANCE as usize;
        if self.buffer.len() <= window * 4 {
            return;
        }
        // Removing the stale prefix shifts the retained tail to index 0.
        let stale = self.buffer.len() - window;
        self.buffer.drain(..stale);
        self.offset = window;
    }
}
impl<R> Read for Decoder<R>
where
    R: Read,
{
    /// Copies decoded bytes into `buf`, decoding further DEFLATE blocks from
    /// the underlying reader whenever the internal buffer has been drained.
    ///
    /// Returns the number of bytes written to `buf`. `Ok(0)` is returned when
    /// `buf` is empty while decoded data is pending, or when the final block
    /// (BFINAL set) has been fully delivered.
    ///
    /// # Errors
    ///
    /// * Any I/O error from the underlying reader or the bit reader.
    /// * `InvalidData` if a block header carries the reserved BTYPE value or
    ///   if a block body is malformed.
    fn read(&mut self, buf: &mut [u8]) -> io::Result<usize> {
        // Iterate rather than recurse: a stream may hold arbitrarily many
        // blocks that decode to zero bytes (e.g. stored blocks with LEN=0),
        // and one stack frame per such block could overflow the stack on
        // crafted input.
        loop {
            if self.offset < self.buffer.len() {
                let copy_size = cmp::min(buf.len(), self.buffer.len() - self.offset);
                buf[..copy_size].copy_from_slice(&self.buffer[self.offset..][..copy_size]);
                self.offset += copy_size;
                return Ok(copy_size);
            }
            if self.eos {
                return Ok(0);
            }

            // Block header: 1 bit BFINAL followed by 2 bits BTYPE.
            let bfinal = self.bit_reader.read_bit()?;
            let btype = self.bit_reader.read_bits(2)?;
            self.eos = bfinal;
            // Everything buffered so far has been delivered, so old history
            // can be dropped before the next block is appended.
            self.truncate_old_buffer();
            match btype {
                0b00 => self.read_non_compressed_block()?,
                0b01 => self.read_compressed_block(&symbol::FixedHuffmanCodec)?,
                0b10 => self.read_compressed_block(&symbol::DynamicHuffmanCodec)?,
                // NOTE: the text says `0x11` although the reserved value is
                // binary `0b11`; the message is kept verbatim because callers
                // may match on it.
                0b11 => {
                    return Err(invalid_data_error!(
                        "btype 0x11 of DEFLATE is reserved(error) value"
                    ));
                }
                // `read_bits(2)` can only yield the four values handled above.
                _ => unreachable!(),
            }
        }
    }
}
#[cfg(test)]
mod tests {
    use super::*;
    use crate::deflate::symbol::{DynamicHuffmanCodec, HuffmanCodec};
    use std::io;

    /// Regression test: the dynamic Huffman header of this stream must load
    /// without error once the block header bits have been consumed.
    #[test]
    fn test_issues_3() {
        let input = [
            180, 253, 73, 143, 28, 201, 150, 46, 8, 254, 150, 184, 139, 75, 18, 69, 247, 32, 157,
            51, 27, 141, 132, 207, 78, 210, 167, 116, 243, 160, 223, 136, 141, 66, 205, 76, 221,
            76, 195, 213, 84, 236, 234, 224, 78, 227, 34, 145, 221, 139, 126, 232, 69, 173, 170,
            208, 192, 219, 245, 67, 3, 15, 149, 120, 171, 70, 53, 106, 213, 175, 23, 21, 153, 139,
            254, 27, 249, 75, 234, 124, 71, 116, 56, 71, 68, 212, 204, 121, 115, 64, 222, 160, 203,
            119, 142, 170, 169, 138, 202, 112, 228, 140, 38,
        ];
        let mut reader = crate::bit::BitReader::new(&input[..]);

        // Header: BFINAL must be clear and BTYPE must select dynamic Huffman.
        let bfinal = reader.read_bit().unwrap();
        assert!(!bfinal);
        let btype = reader.read_bits(2).unwrap();
        assert_eq!(btype, 0b10);

        DynamicHuffmanCodec.load(&mut reader).unwrap();
    }

    /// Decoding this stream must fail with `InvalidData` because it contains
    /// a back-reference that reaches before the start of the output.
    #[test]
    fn it_works() {
        let input = [
            180, 253, 73, 143, 28, 201, 150, 46, 8, 254, 150, 184, 139, 75, 18, 69, 247, 32, 157,
            51, 27, 141, 132, 207, 78, 210, 167, 116, 243, 160, 223, 136, 141, 66, 205, 76, 221,
            76, 195, 213, 84, 236, 234, 224, 78, 227, 34, 145, 221, 139, 126, 232, 69, 173, 170,
            208, 192, 219, 245, 67, 3, 15, 149, 120, 171, 70, 53, 106, 213, 175, 23, 21, 153, 139,
            254, 27, 249, 75, 234, 124, 71, 116, 56, 71, 68, 212, 204, 121, 115, 64, 222, 160, 203,
            119, 142, 170, 169, 138, 202, 112, 228, 140, 38, 171, 162, 88, 212, 235, 56, 136, 231,
            233, 239, 113, 249, 163, 252, 16, 42, 138, 49, 226, 108, 73, 28, 153,
        ];
        let mut decoder = Decoder::new(&input[..]);

        match io::copy(&mut decoder, &mut io::sink()) {
            Ok(copied) => panic!("decoding unexpectedly succeeded with {} bytes", copied),
            Err(error) => {
                assert_eq!(error.kind(), io::ErrorKind::InvalidData);
                assert!(error.to_string().starts_with("Too long backword reference"));
            }
        }
    }
}