mirror of
https://github.com/trezor/trezor-firmware.git
synced 2025-01-10 07:20:56 +00:00
80d1ce25c6
[no changelog]
1446 lines
55 KiB
Rust
1446 lines
55 KiB
Rust
/*----------------------------------------------------------------------------/
|
|
/ TJpgDec - Tiny JPEG Decompressor R0.03+trezor (C)ChaN, 2021
|
|
/-----------------------------------------------------------------------------/
|
|
/ The TJpgDec is a generic JPEG decompressor module for tiny embedded systems.
|
|
/ This is a free software that opened for education, research and commercial
|
|
/ developments under license policy of following terms.
|
|
/
|
|
/ Copyright (C) 2021, ChaN, all right reserved.
|
|
/
|
|
/ * The TJpgDec module is a free software and there is NO WARRANTY.
|
|
/ * No restriction on use. You can use, modify and redistribute it for
|
|
/ personal, non-profit or commercial products UNDER YOUR RESPONSIBILITY.
|
|
/ * Redistributions of source code must retain the above copyright notice.
|
|
/
|
|
/-----------------------------------------------------------------------------/
|
|
/ Oct 04, 2011 R0.01 First release.
|
|
/ Feb 19, 2012 R0.01a Fixed decompression fails when scan starts with an escape seq.
|
|
/ Sep 03, 2012 R0.01b Added JD_TBLCLIP option.
|
|
/ Mar 16, 2019 R0.01c Supprted stdint.h.
|
|
/ Jul 01, 2020 R0.01d Fixed wrong integer type usage.
|
|
/ May 08, 2021 R0.02 Supprted grayscale image. Separated configuration options.
|
|
/ Jun 11, 2021 R0.02a Some performance improvement.
|
|
/ Jul 01, 2021 R0.03 Added JD_FASTDECODE option.
|
|
/ Some performance improvement.
|
|
/ Jan 02, 2023 Rust version by Trezor Company, modified to meet our needs.
|
|
/ May 14, 2024 Added better support for decompression resuming after an
|
|
/ output function interruption.
|
|
Trezor modifications:
|
|
- included overflow detection from https://github.com/cmumford/TJpgDec
|
|
- removed JD_FASTDECODE=0 option
|
|
- removed JD_TBLCLIP option
|
|
- allowed interrupted functionality
|
|
- tighter integration into Trezor codebase by using our data structures
|
|
- removed generic input and output functions, replaced by our specific functionality
|
|
- added better support for decompression resuming after an output function interruption
|
|
/----------------------------------------------------------------------------*/
|
|
|
|
#![no_std]
|
|
|
|
use core::{
|
|
f64::consts::{FRAC_1_SQRT_2, SQRT_2},
|
|
mem, slice,
|
|
};
|
|
|
|
/// Specifies output pixel format.
|
|
/// 0: RGB888 (24-bit/pix)
|
|
/// 1: RGB565 (16-bit/pix)
|
|
/// 2: Grayscale (8-bit/pix)
|
|
const JD_FORMAT: u32 = 1;
|
|
|
|
/// Switches output descaling feature.
|
|
/// 0: Disable
|
|
/// 1: Enable
|
|
const JD_USE_SCALE: u32 = 1;
|
|
|
|
/// Optimization level
|
|
/// 0: NOT IMPLEMENTED Basic optimization. Suitable for 8/16-bit MCUs.
|
|
/// 1: + 32-bit barrel shifter. Suitable for 32-bit MCUs.
|
|
/// 2: + Table conversion for huffman decoding (wants 6 << HUFF_BIT bytes of
|
|
/// RAM)
|
|
const JD_FASTDECODE: u32 = 2;
|
|
|
|
/// Specifies size of stream input buffer
|
|
const JD_SZBUF: usize = 512;
|
|
|
|
const HUFF_BIT: u32 = 10;
|
|
const HUFF_LEN: u32 = 1 << HUFF_BIT;
|
|
const HUFF_MASK: u32 = HUFF_LEN - 1;
|
|
|
|
const NUM_DEQUANTIZER_TABLES: usize = 4;
|
|
|
|
#[derive(PartialEq, Eq)]
|
|
pub enum Error {
|
|
/// Interrupted by output function, call `JDEC::decomp` to continue.
|
|
Interrupted,
|
|
/// Device error or wrong termination of input stream.
|
|
Input,
|
|
/// Insufficient memory pool for the image.
|
|
MemoryPool,
|
|
/// Insufficient stream input buffer.
|
|
MemoryInput,
|
|
/// Parameter error.
|
|
Parameter,
|
|
/// Data format error (may be broken data).
|
|
InvalidData,
|
|
/// Not supported JPEG standard.
|
|
UnsupportedJpeg,
|
|
}
|
|
|
|
pub struct JDEC<'p> {
|
|
dctr: usize,
|
|
dptr: usize,
|
|
inbuf: &'p mut [u8],
|
|
dbit: u8,
|
|
scale: u8,
|
|
msx: u8,
|
|
msy: u8,
|
|
qtid: [u8; 3],
|
|
ncomp: u8,
|
|
dcv: [i16; 3],
|
|
nrst: u16,
|
|
rst: u16,
|
|
rsc: u16,
|
|
width: u16,
|
|
height: u16,
|
|
huffbits: [[&'p mut [u8]; 2]; 2],
|
|
huffcode: [[&'p mut [u16]; 2]; 2],
|
|
huffcode_len: [[usize; 2]; 2],
|
|
huffdata: [[&'p mut [u8]; 2]; 2],
|
|
qttbl: [&'p mut [i32]; 4],
|
|
wreg: u32,
|
|
marker: u8,
|
|
longofs: [[u8; 2]; 2],
|
|
hufflut_ac: [&'p mut [u16]; 2],
|
|
hufflut_dc: [&'p mut [u8]; 2],
|
|
workbuf: &'p mut [i32],
|
|
mcubuf: &'p mut [i16],
|
|
mcu_x: u16,
|
|
mcu_y: u16,
|
|
pool: &'p mut [u8],
|
|
}
|
|
|
|
/// Zigzag-order to raster-order conversion table
|
|
#[rustfmt::skip]
|
|
const ZIG: [u8; 64] = [
|
|
0, 1, 8, 16, 9, 2, 3, 10, 17, 24, 32, 25, 18, 11, 4, 5,
|
|
12, 19, 26, 33, 40, 48, 41, 34, 27, 20, 13, 6, 7, 14, 21, 28,
|
|
35, 42, 49, 56, 57, 50, 43, 36, 29, 22, 15, 23, 30, 37, 44, 51,
|
|
58, 59, 52, 45, 38, 31, 39, 46, 53, 60, 61, 54, 47, 55, 62, 63,
|
|
];
|
|
|
|
macro_rules! f {
|
|
($num:expr) => {{
|
|
($num * 8192_f64) as u16
|
|
}};
|
|
}
|
|
|
|
/// Input scale factor of Arai algorithm
|
|
/// (scaled up 16 bits for fixed point operations)
|
|
#[rustfmt::skip]
|
|
const IPSF: [u16; 64] = [
|
|
f!(1.00000), f!(1.38704), f!(1.30656), f!(1.17588), f!(1.00000), f!(0.78570), f!(0.54120), f!(0.27590),
|
|
f!(1.38704), f!(1.92388), f!(1.81226), f!(1.63099), f!(1.38704), f!(1.08979), f!(0.75066), f!(0.38268),
|
|
f!(1.30656), f!(1.81226), f!(1.70711), f!(1.53636), f!(1.30656), f!(1.02656), f!(FRAC_1_SQRT_2), f!(0.36048),
|
|
f!(1.17588), f!(1.63099), f!(1.53636), f!(1.38268), f!(1.17588), f!(0.92388), f!(0.63638), f!(0.32442),
|
|
f!(1.00000), f!(1.38704), f!(1.30656), f!(1.17588), f!(1.00000), f!(0.78570), f!(0.54120), f!(0.27590),
|
|
f!(0.78570), f!(1.08979), f!(1.02656), f!(0.92388), f!(0.78570), f!(0.61732), f!(0.42522), f!(0.21677),
|
|
f!(0.54120), f!(0.75066), f!(FRAC_1_SQRT_2), f!(0.63638), f!(0.54120), f!(0.42522), f!(0.29290), f!(0.14932),
|
|
f!(0.27590), f!(0.38268), f!(0.36048), f!(0.32442), f!(0.27590), f!(0.21678), f!(0.14932), f!(0.07612),
|
|
];
|
|
|
|
impl<'p> JDEC<'p> {
|
|
/// Allocate a memory block from memory pool
|
|
/// `self`: decompressor object reference
|
|
/// `ndata` number of `T` items to allocate
|
|
fn alloc_slice<T>(&mut self, ndata: usize) -> Result<&'p mut [T], Error> {
|
|
let ndata_bytes = ndata * mem::size_of::<T>();
|
|
let ndata_aligned = (ndata_bytes + 3) & !3;
|
|
if self.pool.len() < ndata_aligned {
|
|
// Err: not enough memory
|
|
return Err(Error::MemoryPool);
|
|
}
|
|
|
|
// SAFETY:
|
|
// - Memory is valid because it comes from a valid slice.
|
|
// - Memory is initialized because here we consider integers always
|
|
// initialized.
|
|
// - The slices do not overlap and the original reference is overwritten,
|
|
// ensuring that the returned references are exclusive.
|
|
unsafe {
|
|
let data = slice::from_raw_parts_mut(self.pool.as_mut_ptr() as _, ndata);
|
|
let newpool = slice::from_raw_parts_mut(
|
|
self.pool.as_mut_ptr().add(ndata_aligned),
|
|
self.pool.len() - ndata_aligned,
|
|
);
|
|
self.pool = newpool;
|
|
Ok(data)
|
|
}
|
|
}
|
|
|
|
fn jpeg_in(&mut self, inbuf_offset: Option<usize>, n_data: usize, input_func: &mut dyn JpegInput) -> usize {
|
|
if let Some(offset) = inbuf_offset {
|
|
let inbuf = &mut self.inbuf[offset..offset + n_data];
|
|
input_func.read(Some(inbuf), n_data)
|
|
} else {
|
|
input_func.read(None, n_data)
|
|
}
|
|
}
|
|
|
|
/// Create de-quantization and prescaling tables with a DQT segment
|
|
/// `self`: decompressor object reference
|
|
/// `ndata`: size of input data
|
|
fn create_qt_tbl(&mut self, mut ndata: usize) -> Result<(), Error> {
|
|
let mut i: u32;
|
|
let mut d: u8;
|
|
let mut data_idx = 0;
|
|
while ndata != 0 {
|
|
// Process all tables in the segment
|
|
if ndata < 65 {
|
|
// Err: table size is unaligned
|
|
return Err(Error::InvalidData);
|
|
}
|
|
ndata -= 65;
|
|
|
|
d = self.inbuf[data_idx]; // Get table property
|
|
data_idx += 1;
|
|
if d & 0xf0 != 0 {
|
|
// Err: not 8-bit resolution
|
|
return Err(Error::InvalidData);
|
|
}
|
|
i = (d & 3) as u32; // Get table ID
|
|
|
|
// Allocate a memory block for the table
|
|
// Register the table
|
|
self.qttbl[i as usize] = self.alloc_slice(64)?;
|
|
for zi in ZIG {
|
|
// Load the table
|
|
// Apply scale factor of Arai algorithm to the de-quantizers
|
|
self.qttbl[i as usize][zi as usize] =
|
|
((self.inbuf[data_idx] as u32) * IPSF[zi as usize] as u32) as i32;
|
|
data_idx += 1;
|
|
}
|
|
}
|
|
Ok(())
|
|
}
|
|
|
|
/// Create huffman code tables with a DHT segment
|
|
/// `self`: decompressor object reference
|
|
/// `ndata`: size of input data
|
|
fn create_huffman_tbl(&mut self, mut ndata: usize) -> Result<(), Error> {
|
|
let mut j: u32;
|
|
let mut b: u32;
|
|
let mut cls: usize;
|
|
let mut num: usize;
|
|
let mut np: usize;
|
|
let mut d: u8;
|
|
let mut hc: u16;
|
|
let mut data_idx = 0;
|
|
while ndata != 0 {
|
|
// Process all tables in the segment
|
|
if ndata < 17 {
|
|
// Err: wrong data size
|
|
return Err(Error::InvalidData);
|
|
}
|
|
ndata -= 17;
|
|
d = self.inbuf[data_idx]; // Get table number and class
|
|
data_idx += 1;
|
|
if d & 0xee != 0 {
|
|
// Err: invalid class/number
|
|
return Err(Error::InvalidData);
|
|
}
|
|
cls = d as usize >> 4; // class = dc(0)/ac(1)
|
|
num = d as usize & 0xf; // table number = 0/1
|
|
// Allocate a memory block for the bit distribution table
|
|
self.huffbits[num][cls] = self.alloc_slice(16)?;
|
|
|
|
np = 0;
|
|
for i in 0..16 {
|
|
// Load number of patterns for 1 to 16-bit code
|
|
// Get sum of code words for each code
|
|
self.huffbits[num][cls][i] = self.inbuf[data_idx];
|
|
np += self.inbuf[data_idx] as usize;
|
|
data_idx += 1;
|
|
}
|
|
// Allocate a memory block for the code word table
|
|
self.huffcode[num][cls] = self.alloc_slice(np)?;
|
|
self.huffcode_len[num][cls] = np;
|
|
|
|
// Re-build huffman code word table
|
|
hc = 0;
|
|
j = 0;
|
|
for i in 0..16 {
|
|
b = self.huffbits[num][cls][i] as u32;
|
|
while b > 0 {
|
|
self.huffcode[num][cls][j as usize] = hc;
|
|
hc += 1;
|
|
j += 1;
|
|
b -= 1;
|
|
}
|
|
hc <<= 1;
|
|
}
|
|
if ndata < np {
|
|
// Err: wrong data size
|
|
return Err(Error::InvalidData);
|
|
}
|
|
ndata -= np;
|
|
|
|
// Allocate a memory block for the decoded data
|
|
self.huffdata[num][cls] = self.alloc_slice(np)?;
|
|
|
|
// Load decoded data corresponds to each code word
|
|
for i in 0..np {
|
|
d = self.inbuf[data_idx];
|
|
data_idx += 1;
|
|
if cls == 0 && d > 11 {
|
|
return Err(Error::InvalidData);
|
|
}
|
|
self.huffdata[num][cls][i] = d;
|
|
}
|
|
if JD_FASTDECODE == 2 {
|
|
// Create fast huffman decode table
|
|
let mut span: u32;
|
|
let mut td: u32;
|
|
let mut ti: u32;
|
|
if cls != 0 {
|
|
// LUT for AC elements
|
|
self.hufflut_ac[num] = self.alloc_slice(HUFF_LEN as usize)?;
|
|
// Default value (0xFFFF: may be long code)
|
|
self.hufflut_ac[num].fill(0xffff);
|
|
} else {
|
|
// LUT for DC elements
|
|
self.hufflut_dc[num] = self.alloc_slice(HUFF_LEN as usize)?;
|
|
// Default value (0xFF: may be long code)
|
|
self.hufflut_dc[num].fill(0xff);
|
|
}
|
|
let mut i = 0;
|
|
|
|
// Create LUT
|
|
for b in 0..HUFF_BIT {
|
|
j = self.huffbits[num][cls][b as usize] as u32;
|
|
while j != 0 {
|
|
// Index of input pattern for the code
|
|
ti =
|
|
(self.huffcode[num][cls][i] << ((HUFF_BIT - 1) - b)) as u32 & HUFF_MASK;
|
|
|
|
if cls != 0 {
|
|
// b15..b8: code length, b7..b0: zero run and data length
|
|
td = self.huffdata[num][cls][i] as u32 | (b + 1) << 8;
|
|
i += 1;
|
|
span = 1 << ((HUFF_BIT - 1) - b);
|
|
while span != 0 {
|
|
span -= 1;
|
|
self.hufflut_ac[num][ti as usize] = td as u16;
|
|
ti += 1;
|
|
}
|
|
} else {
|
|
// b7..b4: code length, b3..b0: data length
|
|
td = self.huffdata[num][cls][i] as u32 | (b + 1) << 4;
|
|
i += 1;
|
|
span = 1 << ((HUFF_BIT - 1) - b);
|
|
while span != 0 {
|
|
span -= 1;
|
|
self.hufflut_dc[num][ti as usize] = td as u8;
|
|
ti += 1;
|
|
}
|
|
}
|
|
j -= 1;
|
|
}
|
|
}
|
|
// Code table offset for long code
|
|
self.longofs[num][cls] = i as u8;
|
|
}
|
|
}
|
|
Ok(())
|
|
}
|
|
|
|
/// Extract a huffman decoded data from input stream
|
|
/// `self`: decompressor object reference
|
|
/// `id`: table ID (0:Y, 1:C)
|
|
/// `cls`: table class (0:DC, 1:AC)
|
|
fn huffext(&mut self, id: usize, cls: usize, input_func: &mut dyn JpegInput) -> Result<i32, Error> {
|
|
let mut dc: usize = self.dctr;
|
|
let mut dp: usize = self.dptr;
|
|
let mut d: u32;
|
|
let mut flg: u32 = 0;
|
|
let mut nc: u32;
|
|
let mut bl: u32;
|
|
let mut wbit: u32 = (self.dbit as i32 % 32) as u32;
|
|
let mut w: u32 = self.wreg & ((1 << wbit) - 1);
|
|
while wbit < 16 {
|
|
// Prepare 16 bits into the working register
|
|
if self.marker != 0 {
|
|
d = 0xff; // Input stream has stalled for a marker. Generate
|
|
// stuff bits
|
|
} else {
|
|
if dc == 0 {
|
|
// Buffer empty, re-fill input buffer
|
|
dp = 0; // Top of input buffer
|
|
dc = self.jpeg_in(Some(0), JD_SZBUF, input_func);
|
|
if dc == 0 {
|
|
// Err: read error or wrong stream termination
|
|
return Err(Error::Input);
|
|
}
|
|
}
|
|
d = self.inbuf[dp] as u32;
|
|
dp += 1;
|
|
|
|
dc -= 1;
|
|
if flg != 0 {
|
|
// In flag sequence?
|
|
flg = 0; // Exit flag sequence
|
|
if d != 0 {
|
|
// Not an escape of 0xFF but a marker
|
|
self.marker = d as u8;
|
|
}
|
|
d = 0xff;
|
|
} else if d == 0xff {
|
|
// Is start of flag sequence?
|
|
// Enter flag sequence, get trailing byte
|
|
flg = 1;
|
|
continue;
|
|
}
|
|
}
|
|
// Shift 8 bits in the working register
|
|
w = w << 8 | d;
|
|
wbit += 8;
|
|
}
|
|
self.dctr = dc;
|
|
self.dptr = dp;
|
|
self.wreg = w;
|
|
|
|
let mut hb_idx = 0;
|
|
let mut hc_idx = 0;
|
|
let mut hd_idx = 0;
|
|
|
|
if JD_FASTDECODE == 2 {
|
|
// Table serch for the short codes
|
|
d = w >> (wbit - HUFF_BIT); // Short code as table index
|
|
if cls != 0 {
|
|
// AC element
|
|
d = self.hufflut_ac[id][d as usize] as u32; // Table decode
|
|
if d != 0xffff {
|
|
// It is done if hit in short code
|
|
self.dbit = (wbit - (d >> 8)) as u8; // Snip the code length
|
|
return Ok((d & 0xff) as i32); // b7..0: zero run and
|
|
// following
|
|
// data bits
|
|
}
|
|
} else {
|
|
// DC element
|
|
d = self.hufflut_dc[id][d as usize] as u32; // Table decode
|
|
if d != 0xff {
|
|
// It is done if hit in short code
|
|
self.dbit = (wbit - (d >> 4)) as u8; // Snip the code length
|
|
return Ok((d & 0xf) as i32); // b3..0: following data bits
|
|
}
|
|
}
|
|
|
|
// Incremental serch for the codes longer than HUFF_BIT
|
|
hb_idx = HUFF_BIT; // Bit distribution table
|
|
hc_idx = self.longofs[id][cls]; // Code word table
|
|
hd_idx = self.longofs[id][cls]; // Data table
|
|
bl = HUFF_BIT + 1;
|
|
} else {
|
|
// Incremental search for all codes
|
|
bl = 1;
|
|
}
|
|
|
|
// Incremental search
|
|
while bl <= 16 {
|
|
nc = self.huffbits[id][cls][hb_idx as usize] as u32;
|
|
hb_idx += 1;
|
|
if nc != 0 {
|
|
d = w >> (wbit - bl);
|
|
loop {
|
|
// Search the code word in this bit length
|
|
if hc_idx as usize >= self.huffcode_len[id][cls] {
|
|
return Err(Error::InvalidData);
|
|
}
|
|
let val = self.huffcode[id][cls][hc_idx as usize];
|
|
if d == val as u32 {
|
|
// Matched?
|
|
self.dbit = (wbit - bl) as u8; // Snip the huffman code
|
|
// Return the decoded data
|
|
return Ok(self.huffdata[id][cls][hd_idx as usize] as i32);
|
|
}
|
|
hc_idx += 1;
|
|
hd_idx += 1;
|
|
nc -= 1;
|
|
if nc == 0 {
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
bl += 1;
|
|
}
|
|
|
|
// Err: code not found (may be collapted data)
|
|
Err(Error::InvalidData)
|
|
}
|
|
|
|
/// Extract N bits from input stream
|
|
/// `self`: decompressor object reference
|
|
/// `nbit`: number of bits to extract (1 to 16)
|
|
fn bitext(&mut self, nbit: u32, input_func: &mut dyn JpegInput) -> Result<i32, Error> {
|
|
let mut dc: usize = self.dctr;
|
|
let mut dp: usize = self.dptr;
|
|
let mut d: u32;
|
|
let mut flg: u32 = 0;
|
|
let mut wbit: u32 = (self.dbit as i32 % 32) as u32;
|
|
let mut w: u32 = self.wreg & ((1 << wbit) - 1);
|
|
while wbit < nbit {
|
|
// Prepare nbit bits into the working register
|
|
if self.marker != 0 {
|
|
d = 0xff; // Input stream stalled, generate stuff bits
|
|
} else {
|
|
if dc == 0 {
|
|
// Buffer empty, re-fill input buffer
|
|
dp = 0; // Top of input buffer
|
|
dc = self.jpeg_in(Some(0), JD_SZBUF, input_func);
|
|
if dc == 0 {
|
|
// Err: read error or wrong stream termination
|
|
return Err(Error::Input);
|
|
}
|
|
}
|
|
d = self.inbuf[dp] as u32;
|
|
dp += 1;
|
|
dc -= 1;
|
|
if flg != 0 {
|
|
// In flag sequence?
|
|
flg = 0; // Exit flag sequence
|
|
if d != 0 {
|
|
// Not an escape of 0xFF but a marker
|
|
self.marker = d as u8;
|
|
}
|
|
d = 0xff;
|
|
} else if d == 0xff {
|
|
// Is start of flag sequence?
|
|
flg = 1; // Enter flag sequence, get trailing byte
|
|
continue;
|
|
}
|
|
}
|
|
w = w << 8 | d;
|
|
wbit += 8;
|
|
}
|
|
self.wreg = w;
|
|
self.dbit = (wbit - nbit) as u8;
|
|
self.dctr = dc;
|
|
self.dptr = dp;
|
|
|
|
Ok((w >> ((wbit - nbit) % 32)) as i32)
|
|
}
|
|
|
|
/// Process restart interval
|
|
/// `self`: decompressor object reference
|
|
/// `rstn`: expected restart sequence number
|
|
fn restart(&mut self, rstn: u16, input_func: &mut dyn JpegInput) -> Result<(), Error> {
|
|
let mut dp = self.dptr;
|
|
let mut dc: usize = self.dctr;
|
|
let mut marker: u16;
|
|
if self.marker != 0 {
|
|
// Generate a maker if it has been detected
|
|
marker = 0xff00 | self.marker as u16;
|
|
self.marker = 0;
|
|
} else {
|
|
marker = 0;
|
|
for _ in 0..2 {
|
|
// Get a restart marker
|
|
if dc == 0 {
|
|
// No input data is available, re-fill input buffer
|
|
dp = 0;
|
|
dc = self.jpeg_in(Some(0), JD_SZBUF, input_func);
|
|
if dc == 0 {
|
|
return Err(Error::Input);
|
|
}
|
|
}
|
|
// Get a byte
|
|
let b = self.inbuf[dp] as u16;
|
|
marker = marker << 8 | b;
|
|
dp += 1;
|
|
dc -= 1;
|
|
}
|
|
self.dptr = dp;
|
|
self.dctr = dc;
|
|
}
|
|
|
|
// Check the marker
|
|
if marker & 0xffd8 != 0xffd0 || marker & 7 != rstn & 7 {
|
|
// Err: expected RSTn marker was not detected (may be collapted data)
|
|
return Err(Error::InvalidData);
|
|
}
|
|
self.dbit = 0; // Discard stuff bits
|
|
// Reset DC offset
|
|
self.dcv[0] = 0;
|
|
self.dcv[1] = 0;
|
|
self.dcv[2] = 0;
|
|
Ok(())
|
|
}
|
|
|
|
/// Apply Inverse-DCT in Arai Algorithm
|
|
/// `src`: input block data (de-quantized and pre-scaled for Arai Algorithm)
|
|
/// `dst`: destination to store the block as byte array
|
|
fn block_idct(src: &mut [i32], dst: &mut [i16]) {
|
|
let m13: i32 = (SQRT_2 * 4096_f64) as i32;
|
|
let m2: i32 = (1.08239f64 * 4096_f64) as i32;
|
|
let m4: i32 = (2.61313f64 * 4096_f64) as i32;
|
|
let m5: i32 = (1.84776f64 * 4096_f64) as i32;
|
|
let mut v0: i32;
|
|
let mut v1: i32;
|
|
let mut v2: i32;
|
|
let mut v3: i32;
|
|
let mut v4: i32;
|
|
let mut v5: i32;
|
|
let mut v6: i32;
|
|
let mut v7: i32;
|
|
let mut t10: i32;
|
|
let mut t11: i32;
|
|
let mut t12: i32;
|
|
let mut t13: i32;
|
|
|
|
// Process columns
|
|
for idx in 0..8 {
|
|
// Get even elements
|
|
v0 = src[idx];
|
|
v1 = src[idx + 8 * 2];
|
|
v2 = src[idx + 8 * 4];
|
|
v3 = src[idx + 8 * 6];
|
|
|
|
// Process the even elements
|
|
t10 = v0 + v2;
|
|
t12 = v0 - v2;
|
|
t11 = ((v1 - v3) * m13) >> 12;
|
|
v3 += v1;
|
|
t11 -= v3;
|
|
v0 = t10 + v3;
|
|
v3 = t10 - v3;
|
|
v1 = t11 + t12;
|
|
v2 = t12 - t11;
|
|
|
|
// Get odd elements
|
|
v4 = src[idx + 8 * 7];
|
|
v5 = src[idx + 8];
|
|
v6 = src[idx + 8 * 5];
|
|
v7 = src[idx + 8 * 3];
|
|
|
|
// Process the odd elements
|
|
t10 = v5 - v4;
|
|
t11 = v5 + v4;
|
|
t12 = v6 - v7;
|
|
v7 += v6;
|
|
v5 = ((t11 - v7) * m13) >> 12;
|
|
v7 += t11;
|
|
t13 = ((t10 + t12) * m5) >> 12;
|
|
v4 = t13 - ((t10 * m2) >> 12);
|
|
v6 = t13 - ((t12 * m4) >> 12) - v7;
|
|
v5 -= v6;
|
|
v4 -= v5;
|
|
|
|
// Write-back transformed values
|
|
src[idx] = v0 + v7;
|
|
src[idx + 8 * 7] = v0 - v7;
|
|
src[idx + 8] = v1 + v6;
|
|
src[idx + 8 * 6] = v1 - v6;
|
|
src[idx + 8 * 2] = v2 + v5;
|
|
src[idx + 8 * 5] = v2 - v5;
|
|
src[idx + 8 * 3] = v3 + v4;
|
|
src[idx + 8 * 4] = v3 - v4;
|
|
}
|
|
|
|
// Process rows
|
|
for idx in (0..64).step_by(8) {
|
|
// Get even elements
|
|
v0 = src[idx] + (128 << 8); // remove DC offset (-128) here
|
|
v1 = src[idx + 2];
|
|
v2 = src[idx + 4];
|
|
v3 = src[idx + 6];
|
|
|
|
// Process the even elements
|
|
t10 = v0 + v2;
|
|
t12 = v0 - v2;
|
|
t11 = ((v1 - v3) * m13) >> 12;
|
|
v3 += v1;
|
|
t11 -= v3;
|
|
v0 = t10 + v3;
|
|
v3 = t10 - v3;
|
|
v1 = t11 + t12;
|
|
v2 = t12 - t11;
|
|
|
|
// Get odd elements
|
|
v4 = src[idx + 7];
|
|
v5 = src[idx + 1];
|
|
v6 = src[idx + 5];
|
|
v7 = src[idx + 3];
|
|
|
|
// Process the odd elements
|
|
t10 = v5 - v4;
|
|
t11 = v5 + v4;
|
|
t12 = v6 - v7;
|
|
v7 += v6;
|
|
v5 = ((t11 - v7) * m13) >> 12;
|
|
v7 += t11;
|
|
t13 = ((t10 + t12) * m5) >> 12;
|
|
v4 = t13 - ((t10 * m2) >> 12);
|
|
v6 = t13 - ((t12 * m4) >> 12) - v7;
|
|
v5 -= v6;
|
|
v4 -= v5;
|
|
|
|
// Descale the transformed values 8 bits and output a row
|
|
dst[idx] = ((v0 + v7) >> 8) as i16;
|
|
dst[idx + 7] = ((v0 - v7) >> 8) as i16;
|
|
dst[idx + 1] = ((v1 + v6) >> 8) as i16;
|
|
dst[idx + 6] = ((v1 - v6) >> 8) as i16;
|
|
dst[idx + 2] = ((v2 + v5) >> 8) as i16;
|
|
dst[idx + 5] = ((v2 - v5) >> 8) as i16;
|
|
dst[idx + 3] = ((v3 + v4) >> 8) as i16;
|
|
dst[idx + 4] = ((v3 - v4) >> 8) as i16;
|
|
}
|
|
}
|
|
|
|
/// Load all blocks in an MCU into working buffer
|
|
/// `self`: decompressor object reference
|
|
fn mcu_load(&mut self, input_func: &mut dyn JpegInput) -> Result<(), Error> {
|
|
let mut d: i32;
|
|
let mut e: i32;
|
|
let mut blk: u32;
|
|
let mut bc: u32;
|
|
let mut z: u32;
|
|
let mut id: u32;
|
|
let mut cmp: u32;
|
|
let nby = (self.msx as i32 * self.msy as i32) as u32; // Number of Y blocks (1, 2 or 4)
|
|
let mut mcu_buf_idx = 0; // Pointer to the first block of MCU
|
|
blk = 0;
|
|
while blk < nby + 2 {
|
|
// Get nby Y blocks and two C blocks
|
|
cmp = if blk < nby { 0 } else { blk - nby + 1 }; // Component number 0:Y, 1:Cb, 2:Cr
|
|
if cmp != 0 && self.ncomp as i32 != 3 {
|
|
// Clear C blocks if not exist (monochrome image)
|
|
for i in 0..64 {
|
|
self.mcubuf[mcu_buf_idx + i] = 128;
|
|
}
|
|
} else {
|
|
// Load Y/C blocks from input stream
|
|
id = if cmp != 0 { 1 } else { 0 }; // Huffman table ID of this component
|
|
|
|
// Extract a DC element from input stream
|
|
d = self.huffext(id as usize, 0, input_func)?; // Extract a huffman coded data (bit length)
|
|
bc = d as u32;
|
|
d = self.dcv[cmp as usize] as i32; // DC value of previous block
|
|
if bc != 0 {
|
|
// If there is any difference from previous block
|
|
e = self.bitext(bc, input_func)?; // Extract data bits
|
|
bc = 1 << (bc - 1); // MSB position
|
|
if e as u32 & bc == 0 {
|
|
e -= ((bc << 1) - 1) as i32; // Restore negative value
|
|
// if
|
|
// needed
|
|
}
|
|
d += e; // Get current value
|
|
self.dcv[cmp as usize] = d as i16; // Save current DC value
|
|
// for
|
|
// next block
|
|
}
|
|
// De-quantizer table ID for this component
|
|
let dqidx = self.qtid[cmp as usize] as usize;
|
|
if dqidx >= NUM_DEQUANTIZER_TABLES {
|
|
return Err(Error::InvalidData);
|
|
}
|
|
// De-quantize, apply scale factor of Arai algorithm and descale 8 bits
|
|
let dfq = &self.qttbl[dqidx];
|
|
self.workbuf[0] = (d * dfq[0]) >> 8;
|
|
|
|
// Extract following 63 AC elements from input stream
|
|
self.workbuf[1..64].fill(0); // Initialize all AC elements
|
|
z = 1; // Top of the AC elements (in zigzag-order)
|
|
loop {
|
|
// Extract a huffman coded value (zero runs and bit length)
|
|
d = self.huffext(id as usize, 1, input_func)?;
|
|
if d == 0 {
|
|
// EOB?
|
|
break;
|
|
}
|
|
bc = d as u32;
|
|
z += bc >> 4; // Skip leading zero run
|
|
if z >= 64 {
|
|
// Too long zero run
|
|
return Err(Error::InvalidData);
|
|
}
|
|
bc &= 0xf;
|
|
if bc != 0 {
|
|
// Bit length?
|
|
d = self.bitext(bc, input_func)?; // Extract data bits
|
|
bc = 1 << (bc - 1); // MSB position
|
|
if d as u32 & bc == 0 {
|
|
// Restore negative value if needed
|
|
d -= ((bc << 1) - 1) as i32;
|
|
}
|
|
let i = ZIG[z as usize] as u32; // Get raster-order index
|
|
// De-quantize, apply scale factor of Arai algorithm and descale 8 bits
|
|
let dqidx = self.qtid[cmp as usize] as usize;
|
|
if dqidx >= NUM_DEQUANTIZER_TABLES {
|
|
return Err(Error::InvalidData);
|
|
}
|
|
let dfq = &self.qttbl[dqidx];
|
|
self.workbuf[i as usize] = (d * dfq[i as usize]) >> 8;
|
|
}
|
|
z += 1;
|
|
if z >= 64 {
|
|
break;
|
|
}
|
|
}
|
|
|
|
// C components may not be processed if in grayscale output
|
|
if JD_FORMAT != 2 || cmp == 0 {
|
|
// If no AC element or scale ratio is 1/8, IDCT can be omitted and the block is
|
|
// filled with DC value
|
|
if z == 1 || JD_USE_SCALE != 0 && self.scale == 3 {
|
|
d = self.workbuf[0] / 256 + 128;
|
|
if JD_FASTDECODE >= 1 {
|
|
for i in 0..64 {
|
|
self.mcubuf[mcu_buf_idx + i] = d as i16;
|
|
}
|
|
} else {
|
|
self.mcubuf[..64].fill(d as i16);
|
|
}
|
|
} else {
|
|
// Apply IDCT and store the block to the MCU buffer
|
|
Self::block_idct(self.workbuf, &mut self.mcubuf[mcu_buf_idx..]);
|
|
}
|
|
}
|
|
}
|
|
mcu_buf_idx += 64; // Next block
|
|
blk += 1;
|
|
}
|
|
Ok(()) // All blocks have been loaded successfully
|
|
}
|
|
|
|
/// Output an MCU: Convert YCrCb to RGB and output it in RGB form
|
|
/// `self`: decompressor object reference
|
|
/// `x`: MCU location in the image
|
|
/// `y`: MCU location in the image
|
|
fn mcu_output(
|
|
&mut self,
|
|
mut x: u32,
|
|
mut y: u32,
|
|
output_func: &mut dyn JpegOutput,
|
|
) -> Result<(), Error> {
|
|
// Adaptive accuracy for both 16-/32-bit systems
|
|
let cvacc: i32 = if mem::size_of::<i32>() > 2 { 1024 } else { 128 };
|
|
let mut yy: i32;
|
|
let mut cb: i32;
|
|
let mut cr: i32;
|
|
let mut py_idx: usize;
|
|
let mut pc_idx: usize;
|
|
|
|
// MCU size (pixel)
|
|
let mut mx = (self.msx as i32 * 8) as u32;
|
|
let my = (self.msy as i32 * 8) as u32;
|
|
|
|
// Output rectangular size (it may be clipped at right/bottom end of image)
|
|
let mut rx = if (x + mx) <= self.width as u32 {
|
|
mx
|
|
} else {
|
|
self.width as u32 - x
|
|
};
|
|
let mut ry = if (y + my) <= self.height as u32 {
|
|
my
|
|
} else {
|
|
self.height as u32 - y
|
|
};
|
|
if JD_USE_SCALE != 0 {
|
|
rx >>= self.scale;
|
|
ry >>= self.scale;
|
|
if rx == 0 || ry == 0 {
|
|
// Skip this MCU if all pixel is to be rounded off
|
|
return Ok(());
|
|
}
|
|
x >>= self.scale;
|
|
y >>= self.scale;
|
|
}
|
|
let rect_origin = (x, y);
|
|
let rect_size = (rx, ry);
|
|
|
|
// SAFETY: Aligning to u8 slice is safe, because the original slice is aligned
|
|
// to 32 bits, therefore there are also no residuals (prefix/suffix).
|
|
// The data in the slices are integers, so these are valid for both i32
|
|
// and u8.
|
|
let (_, workbuf, _) = unsafe { self.workbuf.align_to_mut::<u8>() };
|
|
|
|
let mut pix_idx: usize = 0;
|
|
let mut op_idx: usize;
|
|
|
|
if JD_USE_SCALE == 0 || self.scale != 3 {
|
|
// Not for 1/8 scaling
|
|
if JD_FORMAT != 2 {
|
|
// RGB output (build an RGB MCU from Y/C component)
|
|
for iy in 0..my {
|
|
py_idx = 0;
|
|
pc_idx = 0;
|
|
if my == 16 {
|
|
// Double block height?
|
|
pc_idx += (64 * 4) + ((iy as usize >> 1) * 8);
|
|
if iy >= 8 {
|
|
py_idx += 64;
|
|
}
|
|
} else {
|
|
// Single block height
|
|
pc_idx += (mx * 8 + iy * 8) as usize;
|
|
}
|
|
py_idx += (iy * 8) as usize;
|
|
for ix in 0..mx {
|
|
cb = self.mcubuf[pc_idx] as i32 - 128; // Get Cb/Cr component and remove offset
|
|
cr = self.mcubuf[pc_idx + 64] as i32 - 128;
|
|
if mx == 16 {
|
|
// Double block width?
|
|
if ix == 8 {
|
|
// Jump to next block if double block height
|
|
py_idx += 64 - 8;
|
|
}
|
|
// Step forward chroma pointer every two pixels
|
|
pc_idx += (ix & 1) as usize;
|
|
} else {
|
|
// Single block width
|
|
// Step forward chroma pointer every pixel
|
|
pc_idx += 1;
|
|
}
|
|
// Get Y component
|
|
yy = self.mcubuf[py_idx] as i32;
|
|
py_idx += 1;
|
|
// R
|
|
workbuf[pix_idx] = (yy + (1.402f64 * cvacc as f64) as i32 * cr / cvacc)
|
|
.clamp(0, 255) as u8;
|
|
pix_idx += 1;
|
|
// G
|
|
workbuf[pix_idx] = (yy
|
|
- ((0.344f64 * cvacc as f64) as i32 * cb
|
|
+ (0.714f64 * cvacc as f64) as i32 * cr)
|
|
/ cvacc)
|
|
.clamp(0, 255) as u8;
|
|
pix_idx += 1;
|
|
// B
|
|
workbuf[pix_idx] = (yy + (1.772f64 * cvacc as f64) as i32 * cb / cvacc)
|
|
.clamp(0, 255) as u8;
|
|
pix_idx += 1;
|
|
}
|
|
}
|
|
} else {
|
|
// Monochrome output (build a grayscale MCU from Y comopnent)
|
|
|
|
for iy in 0..my {
|
|
py_idx = (iy * 8) as usize;
|
|
if my == 16 && iy >= 8 {
|
|
// Double block height?
|
|
py_idx += 64;
|
|
}
|
|
for ix in 0..mx {
|
|
if mx == 16 && ix == 8 {
|
|
// Double block width?
|
|
// Jump to next block if double block height
|
|
py_idx += 64 - 8;
|
|
}
|
|
// Get and store a Y value as grayscale
|
|
workbuf[pix_idx] = self.mcubuf[py_idx] as u8;
|
|
pix_idx += 1;
|
|
py_idx += 1;
|
|
}
|
|
}
|
|
}
|
|
// Descale the MCU rectangular if needed
|
|
if JD_USE_SCALE != 0 && self.scale != 0 {
|
|
// Get averaged RGB value of each square corresponds to a pixel
|
|
let s = (self.scale * 2) as u32; // Number of shifts for averaging
|
|
let w = 1 << self.scale as u32; // Width of square
|
|
let a = (mx - w) * (if JD_FORMAT != 2 { 3 } else { 1 }); // Bytes to skip for next line in the square
|
|
op_idx = 0;
|
|
for iy in (0..my).step_by(w as usize) {
|
|
for ix in (0..mx).step_by(w as usize) {
|
|
pix_idx = ((iy * mx + ix) * (if JD_FORMAT != 2 { 3 } else { 1 })) as usize;
|
|
let mut b = 0;
|
|
let mut g = 0;
|
|
let mut r = 0;
|
|
for _ in 0..w {
|
|
// Accumulate RGB value in the square
|
|
for _ in 0..w {
|
|
// Accumulate R or Y (monochrome output)
|
|
r += workbuf[pix_idx] as u32;
|
|
pix_idx += 1;
|
|
if JD_FORMAT != 2 {
|
|
// Accumulate G
|
|
g += workbuf[pix_idx] as u32;
|
|
pix_idx += 1;
|
|
// Accumulate B
|
|
b += workbuf[pix_idx] as u32;
|
|
pix_idx += 1;
|
|
}
|
|
}
|
|
pix_idx += a as usize;
|
|
}
|
|
// Put the averaged pixel value
|
|
// Put R or Y (monochrome output)
|
|
workbuf[op_idx] = (r >> s) as u8;
|
|
op_idx += 1;
|
|
if JD_FORMAT != 2 {
|
|
// RGB output?
|
|
// Put G
|
|
workbuf[op_idx] = (g >> s) as u8;
|
|
op_idx += 1;
|
|
// Put B
|
|
workbuf[op_idx] = (b >> s) as u8;
|
|
op_idx += 1;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
} else {
|
|
// For only 1/8 scaling (left-top pixel in each block are the DC value of the
|
|
// block) Build a 1/8 descaled RGB MCU from discrete components
|
|
pix_idx = 0;
|
|
pc_idx = (mx * my) as usize;
|
|
cb = self.mcubuf[pc_idx] as i32 - 128; // Get Cb/Cr component and restore right level
|
|
cr = self.mcubuf[pc_idx + 64] as i32 - 128;
|
|
|
|
for iy in (0..my).step_by(8) {
|
|
py_idx = 0;
|
|
if iy == 8 {
|
|
py_idx = 64 * 2;
|
|
}
|
|
for _ in (0..mx).step_by(8) {
|
|
// Get Y component
|
|
yy = self.mcubuf[py_idx] as i32;
|
|
py_idx += 64;
|
|
if JD_FORMAT != 2 {
|
|
// R
|
|
workbuf[pix_idx] = (yy + (1.402f64 * cvacc as f64) as i32 * cr / cvacc)
|
|
.clamp(0, 255) as u8;
|
|
pix_idx += 1;
|
|
// G
|
|
workbuf[pix_idx] = (yy
|
|
- ((0.344f64 * cvacc as f64) as i32 * cb
|
|
+ (0.714f64 * cvacc as f64) as i32 * cr)
|
|
/ cvacc)
|
|
.clamp(0, 255) as u8;
|
|
//B
|
|
pix_idx += 1;
|
|
workbuf[pix_idx] = (yy + (1.772f64 * cvacc as f64) as i32 * cb / cvacc)
|
|
.clamp(0, 255) as u8;
|
|
pix_idx += 1;
|
|
} else {
|
|
workbuf[pix_idx] = yy as u8;
|
|
pix_idx += 1;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// Squeeze up pixel table if a part of MCU is to be truncated
|
|
mx >>= self.scale as i32;
|
|
if rx < mx {
|
|
// Is the MCU spans right edge?
|
|
let mut s_0_idx = 0;
|
|
let mut d_idx = 0;
|
|
for _ in 0..ry {
|
|
for _ in 0..rx {
|
|
// Copy effective pixels
|
|
workbuf[d_idx] = workbuf[s_0_idx];
|
|
s_0_idx += 1;
|
|
d_idx += 1;
|
|
if JD_FORMAT != 2 {
|
|
workbuf[d_idx] = workbuf[s_0_idx];
|
|
s_0_idx += 1;
|
|
d_idx += 1;
|
|
workbuf[d_idx] = workbuf[s_0_idx];
|
|
s_0_idx += 1;
|
|
d_idx += 1;
|
|
}
|
|
}
|
|
// Skip truncated pixels
|
|
s_0_idx += ((mx - rx) * (if JD_FORMAT != 2 { 3 } else { 1 })) as usize;
|
|
}
|
|
}
|
|
|
|
// Convert RGB888 to RGB565 if needed
|
|
if JD_FORMAT == 1 {
|
|
let mut s_1_idx = 0;
|
|
let mut d_0_idx = 0;
|
|
let mut w_0: u16;
|
|
for _ in 0..rx * ry {
|
|
// RRRRR-----------
|
|
w_0 = ((workbuf[s_1_idx] as i32 & 0xf8) << 8) as u16;
|
|
s_1_idx += 1;
|
|
// -----GGGGGG-----
|
|
w_0 = (w_0 as i32 | (workbuf[s_1_idx] as i32 & 0xfc) << 3) as u16;
|
|
s_1_idx += 1;
|
|
// -----------BBBBB
|
|
w_0 = (w_0 as i32 | workbuf[s_1_idx] as i32 >> 3) as u16;
|
|
s_1_idx += 1;
|
|
|
|
workbuf[d_0_idx] = (w_0 & 0xFF) as u8;
|
|
workbuf[d_0_idx + 1] = (w_0 >> 8) as u8;
|
|
d_0_idx += 2;
|
|
}
|
|
}
|
|
|
|
// Output the rectangular
|
|
// SAFETY: Aligning to u16 slice is safe, because the original slice is aligned
|
|
// to 32 bits, therefore there are also no residuals (prefix/suffix).
|
|
// The data in the slices are integers, so these are valid for both i32
|
|
// and u16.
|
|
let (_, bitmap, _) = unsafe { self.workbuf.align_to::<u16>() };
|
|
let bitmap = &bitmap[..(rect_size.0 * rect_size.1) as usize];
|
|
if output_func.write(self, rect_origin, rect_size, bitmap) {
|
|
Ok(())
|
|
} else {
|
|
Err(Error::Interrupted)
|
|
}
|
|
}
|
|
|
|
pub fn mcu_height(&self) -> i16 {
|
|
self.msy as i16 * 8
|
|
}
|
|
|
|
pub fn width(&self) -> i16 {
|
|
self.width as i16
|
|
}
|
|
|
|
pub fn height(&self) -> i16 {
|
|
self.height as i16
|
|
}
|
|
|
|
pub fn set_scale(&mut self, scale: u8) -> Result<(), Error> {
|
|
if scale > (if JD_USE_SCALE != 0 { 3 } else { 0 }) {
|
|
return Err(Error::Parameter);
|
|
}
|
|
self.scale = scale;
|
|
Ok(())
|
|
}
|
|
|
|
/// Analyze the JPEG image and Initialize decompressor object
|
|
pub fn new(input_func: &mut dyn JpegInput, pool: &'p mut [u8]) -> Result<Self, Error> {
|
|
let mut jd = JDEC {
|
|
dctr: 0,
|
|
dptr: 0,
|
|
inbuf: &mut [],
|
|
dbit: 0,
|
|
scale: 0,
|
|
msx: 0,
|
|
msy: 0,
|
|
qtid: [0; 3],
|
|
pool,
|
|
dcv: [0; 3],
|
|
rsc: 0,
|
|
width: 0,
|
|
height: 0,
|
|
huffbits: [[&mut [], &mut []], [&mut [], &mut []]],
|
|
huffcode: [[&mut [], &mut []], [&mut [], &mut []]],
|
|
huffcode_len: [[0; 2]; 2],
|
|
huffdata: [[&mut [], &mut []], [&mut [], &mut []]],
|
|
qttbl: [&mut [], &mut [], &mut [], &mut []],
|
|
wreg: 0,
|
|
marker: 0,
|
|
longofs: [[0; 2]; 2],
|
|
hufflut_ac: [&mut [], &mut []],
|
|
hufflut_dc: [&mut [], &mut []],
|
|
workbuf: &mut [],
|
|
rst: 0,
|
|
ncomp: 0,
|
|
nrst: 0,
|
|
mcubuf: &mut [],
|
|
mcu_x: 0,
|
|
mcu_y: 0,
|
|
};
|
|
|
|
let mut marker: u16;
|
|
let mut ofs: u32;
|
|
let mut len: usize;
|
|
|
|
// Allocate stream input buffer
|
|
jd.inbuf = jd.alloc_slice(JD_SZBUF)?;
|
|
|
|
// Find SOI marker
|
|
marker = 0;
|
|
ofs = marker as u32;
|
|
loop {
|
|
if jd.jpeg_in(Some(0), 1, input_func) != 1 {
|
|
// Err: SOI was not detected
|
|
return Err(Error::Input);
|
|
}
|
|
ofs += 1;
|
|
marker = ((marker as i32) << 8 | jd.inbuf[0] as i32) as u16;
|
|
if marker == 0xffd8 {
|
|
break;
|
|
}
|
|
}
|
|
loop {
|
|
// Parse JPEG segments
|
|
// Get a JPEG marker
|
|
if jd.jpeg_in(Some(0), 4, input_func) != 4 {
|
|
return Err(Error::Input);
|
|
}
|
|
// Marker
|
|
marker = ((jd.inbuf[0] as i32) << 8 | jd.inbuf[1] as i32) as u16;
|
|
// Length field
|
|
len = ((jd.inbuf[2] as i32) << 8 | jd.inbuf[3] as i32) as usize;
|
|
if len <= 2 || marker >> 8 != 0xff {
|
|
return Err(Error::InvalidData);
|
|
}
|
|
len -= 2; // Segment content size
|
|
ofs += (4 + len) as u32; // Number of bytes loaded
|
|
|
|
match marker & 0xff {
|
|
0xC0 => {
|
|
// SOF0 (baseline JPEG)
|
|
if len > JD_SZBUF {
|
|
return Err(Error::MemoryInput);
|
|
}
|
|
// Load segment data
|
|
if jd.jpeg_in(Some(0), len, input_func) != len {
|
|
return Err(Error::Input);
|
|
}
|
|
// Image width in unit of pixel
|
|
jd.width = ((jd.inbuf[3] as i32) << 8 | jd.inbuf[4] as i32) as u16;
|
|
// Image height in unit of pixel
|
|
jd.height = ((jd.inbuf[1] as i32) << 8 | jd.inbuf[2] as i32) as u16;
|
|
// Number of color components
|
|
jd.ncomp = jd.inbuf[5];
|
|
if jd.ncomp != 3 && jd.ncomp != 1 {
|
|
// Err: Supports only Grayscale and Y/Cb/Cr
|
|
return Err(Error::UnsupportedJpeg);
|
|
}
|
|
// Check each image component
|
|
for i in 0..jd.ncomp as usize {
|
|
// Get sampling factor
|
|
let b = jd.inbuf[7 + 3 * i];
|
|
if i == 0 {
|
|
// Y component
|
|
if b != 0x11 && b != 0x22 && b != 0x21 {
|
|
// Check sampling factor
|
|
// Err: Supports only 4:4:4, 4:2:0 or 4:2:2
|
|
return Err(Error::UnsupportedJpeg);
|
|
}
|
|
// Size of MCU [blocks]
|
|
jd.msx = (b as i32 >> 4) as u8;
|
|
jd.msy = (b as i32 & 15) as u8;
|
|
} else if b as i32 != 0x11 {
|
|
// Cb/Cr component
|
|
// Err: Sampling factor of Cb/Cr must be 1
|
|
return Err(Error::UnsupportedJpeg);
|
|
}
|
|
// Get dequantizer table ID for this component
|
|
jd.qtid[i] = jd.inbuf[8 + 3 * i];
|
|
if jd.qtid[i] as i32 > 3 {
|
|
// Err: Invalid ID
|
|
return Err(Error::UnsupportedJpeg);
|
|
}
|
|
}
|
|
}
|
|
0xDD => {
|
|
// DRI - Define Restart Interval
|
|
if len > JD_SZBUF {
|
|
return Err(Error::MemoryInput);
|
|
}
|
|
// Load segment data
|
|
if jd.jpeg_in(Some(0), len, input_func) != len {
|
|
return Err(Error::Input);
|
|
}
|
|
// Get restart interval (MCUs)
|
|
jd.nrst = ((jd.inbuf[0] as i32) << 8 | jd.inbuf[1] as i32) as u16;
|
|
}
|
|
0xC4 => {
|
|
// DHT - Define Huffman Tables
|
|
if len > JD_SZBUF {
|
|
return Err(Error::MemoryInput);
|
|
}
|
|
// Load segment data
|
|
if jd.jpeg_in(Some(0), len, input_func) != len {
|
|
return Err(Error::Input);
|
|
}
|
|
// Create huffman tables
|
|
jd.create_huffman_tbl(len)?;
|
|
}
|
|
0xDB => {
|
|
// DQT - Define Quantizer Tables
|
|
if len > JD_SZBUF {
|
|
return Err(Error::MemoryInput);
|
|
}
|
|
// Load segment data
|
|
if jd.jpeg_in(Some(0), len, input_func) != len {
|
|
return Err(Error::Input);
|
|
}
|
|
// Create de-quantizer tables
|
|
jd.create_qt_tbl(len)?;
|
|
}
|
|
0xDA => {
|
|
// SOS - Start of Scan
|
|
if len > JD_SZBUF {
|
|
return Err(Error::MemoryInput);
|
|
}
|
|
// Load segment data
|
|
if jd.jpeg_in(Some(0), len, input_func) != len {
|
|
return Err(Error::Input);
|
|
}
|
|
if jd.width == 0 || jd.height == 0 {
|
|
// Err: Invalid image size
|
|
return Err(Error::InvalidData);
|
|
}
|
|
if jd.inbuf[0] as i32 != jd.ncomp as i32 {
|
|
// Err: Wrong color components
|
|
return Err(Error::UnsupportedJpeg);
|
|
}
|
|
// Check if all tables corresponding to each components have been loaded
|
|
for i in 0..jd.ncomp as usize {
|
|
// Get huffman table ID
|
|
let b = jd.inbuf[2 + 2 * i];
|
|
if b != 0 && b != 0x11 {
|
|
// Err: Different table number for DC/AC element
|
|
return Err(Error::UnsupportedJpeg);
|
|
}
|
|
let n = if i != 0 { 1 } else { 0 }; // Component class
|
|
|
|
// Check huffman table for this component
|
|
if (jd.huffbits[n][0]).is_empty() || (jd.huffbits[n][1]).is_empty() {
|
|
// Err: Not loaded
|
|
return Err(Error::InvalidData);
|
|
}
|
|
// Check dequantizer table for this component
|
|
if (jd.qttbl[jd.qtid[i] as usize]).is_empty() {
|
|
// Err: Not loaded
|
|
return Err(Error::InvalidData);
|
|
}
|
|
}
|
|
// Allocate working buffer for MCU and pixel output
|
|
let n = jd.msy as i32 * jd.msx as i32; // Number of Y blocks in the MCU
|
|
if n == 0 {
|
|
// Err: SOF0 has not been loaded
|
|
return Err(Error::InvalidData);
|
|
}
|
|
len = (n * 64 * 3 + 64) as usize; // Allocate buffer for IDCT and RGB output
|
|
if len < 256 {
|
|
// but at least 256 byte is required for IDCT
|
|
len = 256;
|
|
}
|
|
|
|
jd.workbuf = jd.alloc_slice(len / 4)?;
|
|
|
|
// Allocate MCU working buffer
|
|
jd.mcubuf = jd.alloc_slice((n as usize + 2) * 64)?;
|
|
|
|
// Align stream read offset to JD_SZBUF
|
|
ofs %= JD_SZBUF as u32;
|
|
if ofs != 0 {
|
|
jd.dctr = jd.jpeg_in(Some(ofs as usize), (JD_SZBUF as u32 - ofs) as usize, input_func);
|
|
}
|
|
jd.dptr = (ofs - (if JD_FASTDECODE != 0 { 0 } else { 1 })) as usize;
|
|
return Ok(jd); // Initialization succeeded. Ready to
|
|
// decompress the JPEG image.
|
|
}
|
|
// SOF1, SOF2, SOF3, SOF5, SOF6, SOF7, SOF9, SOF10, SOF11, SOF13, SOF14, SOF15, EOI
|
|
0xC1 | 0xC2 | 0xC3 | 0xC5 | 0xC6 | 0xC7 | 0xC9 | 0xCA | 0xCB | 0xCD | 0xCF
|
|
| 0xCE | 0xD9 => {
|
|
// Unsupported JPEG standard (may be progressive JPEG)
|
|
return Err(Error::UnsupportedJpeg);
|
|
}
|
|
_ => {
|
|
// Unknown segment (comment, exif or etc..)
|
|
// Skip segment data (null pointer specifies to remove data from the stream)
|
|
if jd.jpeg_in(None, len, input_func) != len {
|
|
return Err(Error::Input);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Start/resume JPEG decompression
|
|
///
|
|
/// The function decompress the JPEG image in stream and calls
|
|
/// the output function for each decoded MCU.
|
|
///
|
|
/// If the output function returns `false`, the decompression is interrupted.
|
|
/// It's possible later to call `decomp()` again to resume the decompression.
|
|
pub fn decomp(&mut self, input_func: &mut dyn JpegInput, output_func: &mut dyn JpegOutput) -> Result<(), Error> {
|
|
let mx = self.msx as u16 * 8; // Size of the MCU (pixel)
|
|
let my = self.msy as u16 * 8; // Size of the MCU (pixel)
|
|
while self.mcu_y < self.height {
|
|
if self.nrst != 0 && {
|
|
// Process restart interval if enabled
|
|
let val = self.rst;
|
|
self.rst += 1;
|
|
val == self.nrst
|
|
} {
|
|
let val = self.rsc;
|
|
self.rsc += 1;
|
|
self.restart(val, input_func)?;
|
|
self.rst = 1;
|
|
}
|
|
|
|
// Load an MCU (decompress huffman coded stream, dequantize and apply IDCT)
|
|
self.mcu_load(input_func)?;
|
|
|
|
let x = self.mcu_x as u32;
|
|
let y = self.mcu_y as u32;
|
|
|
|
self.mcu_x += mx;
|
|
if self.mcu_x >= self.width {
|
|
self.mcu_x = 0;
|
|
self.mcu_y += my;
|
|
}
|
|
|
|
// Output the MCU (YCbCr to RGB, scaling and output)
|
|
self.mcu_output(x, y, output_func)?;
|
|
}
|
|
Ok(())
|
|
}
|
|
|
|
/// Returns pixel coordinates (top-left) of the next decoded MCU
|
|
///
|
|
/// The function is useful when the decompression is interrupted
|
|
/// and later resumed by `decomp()`.
|
|
pub fn next_mcu(&self) -> (u16, u16) {
|
|
(self.mcu_x, self.mcu_y)
|
|
}
|
|
|
|
}
|
|
|
|
pub trait JpegInput {
|
|
fn read(&mut self, buf: Option<&mut [u8]>, nread: usize) -> usize;
|
|
}
|
|
|
|
pub struct BufferInput<'i>(pub &'i [u8]);
|
|
|
|
impl<'i> JpegInput for BufferInput<'i> {
|
|
fn read(&mut self, inbuf: Option<&mut [u8]>, n_data: usize) -> usize {
|
|
let len = n_data.min(self.0.len());
|
|
let (toread, newdata) = self.0.split_at(len);
|
|
if let Some(inbuf) = inbuf {
|
|
(inbuf[..len]).copy_from_slice(toread)
|
|
}
|
|
self.0 = newdata;
|
|
len
|
|
}
|
|
}
|
|
|
|
pub trait JpegOutput {
|
|
/// Return `false` to interrupt.
|
|
fn write(
|
|
&mut self,
|
|
jd: &JDEC,
|
|
rect_origin: (u32, u32),
|
|
rect_size: (u32, u32),
|
|
pixels: &[u16],
|
|
) -> bool;
|
|
}
|
|
|
|
pub struct BlackHoleOutput;
|
|
|
|
impl JpegOutput for BlackHoleOutput {
|
|
fn write(
|
|
&mut self,
|
|
_jd: &JDEC,
|
|
_rect_origin: (u32, u32),
|
|
_rect_size: (u32, u32),
|
|
_bitmap: &[u16],
|
|
) -> bool {
|
|
true
|
|
}
|
|
}
|