feat(pdftract-byq): implement direct image compositing path (Phase 5.2.1)
Implements the default-feature image rendering path for scanned PDFs: - Walk content stream operators and collect image XObjects with CTMs - Decode image XObjects (JPEG, RGB, grayscale, CMYK) via Phase 1.5 - Composite images onto canvas using CTM-based pixel placement - Support page rotation (0, 90, 180, 270 degrees) - Handle Y-flip CTMs (common in PDFs) - Emit IMG_SOFTMASK_UNSUPPORTED diagnostic for soft-masked images Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
This commit is contained in:
parent
dacda5bcfd
commit
e2d2eded65
5 changed files with 1361 additions and 1 deletions
|
|
@ -10,6 +10,7 @@ publish = true
|
||||||
[dependencies]
|
[dependencies]
|
||||||
anyhow = { workspace = true }
|
anyhow = { workspace = true }
|
||||||
hex = "0.4"
|
hex = "0.4"
|
||||||
|
image = { version = "0.25", optional = true }
|
||||||
indexmap = "2.2"
|
indexmap = "2.2"
|
||||||
flate2 = { workspace = true }
|
flate2 = { workspace = true }
|
||||||
lzw = { workspace = true }
|
lzw = { workspace = true }
|
||||||
|
|
@ -31,6 +32,7 @@ phf = "0.11"
|
||||||
default = ["serde"]
|
default = ["serde"]
|
||||||
serde = ["dep:serde", "dep:serde_json"]
|
serde = ["dep:serde", "dep:serde_json"]
|
||||||
receipts = [] # Enable visual citation receipts (SVG clip generation)
|
receipts = [] # Enable visual citation receipts (SVG clip generation)
|
||||||
|
ocr = ["dep:image"] # Enable OCR path (image compositing)
|
||||||
proptest = []
|
proptest = []
|
||||||
fuzzing = [] # Enable cfg(fuzzing) for fuzz harnesses
|
fuzzing = [] # Enable cfg(fuzzing) for fuzz harnesses
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -305,6 +305,14 @@ pub enum DiagCode {
|
||||||
/// Phase origin: 1.7
|
/// Phase origin: 1.7
|
||||||
StructInvalidGeometry,
|
StructInvalidGeometry,
|
||||||
|
|
||||||
|
/// Invalid object type (expected type not found)
|
||||||
|
///
|
||||||
|
/// Emitted when an object is not the expected type (e.g., expecting a stream
|
||||||
|
/// but finding a dictionary). The object is treated as null.
|
||||||
|
///
|
||||||
|
/// Phase origin: 5.2.1
|
||||||
|
StructInvalidType,
|
||||||
|
|
||||||
/// Hybrid xref conflict: traditional table and stream disagree on object state
|
/// Hybrid xref conflict: traditional table and stream disagree on object state
|
||||||
///
|
///
|
||||||
/// Emitted when merging a hybrid file's xref sections and the traditional
|
/// Emitted when merging a hybrid file's xref sections and the traditional
|
||||||
|
|
@ -580,6 +588,31 @@ pub enum DiagCode {
|
||||||
/// Phase origin: 4.7
|
/// Phase origin: 4.7
|
||||||
OcrBrokenVectorUnavailable,
|
OcrBrokenVectorUnavailable,
|
||||||
|
|
||||||
|
/// Image soft mask not supported in direct compositing path
|
||||||
|
///
|
||||||
|
/// Emitted when an image XObject has a /SMask entry. Direct compositing
|
||||||
|
/// doesn't support soft masks; use `full-render` feature for proper rendering.
|
||||||
|
/// The masked image is skipped.
|
||||||
|
///
|
||||||
|
/// Phase origin: 5.2.1
|
||||||
|
ImgSoftmaskUnsupported,
|
||||||
|
|
||||||
|
/// Image format not supported
|
||||||
|
///
|
||||||
|
/// Emitted when an image XObject uses an unsupported format or bits-per-component
|
||||||
|
/// value. The image is skipped.
|
||||||
|
///
|
||||||
|
/// Phase origin: 5.2.1
|
||||||
|
ImgUnsupportedFormat,
|
||||||
|
|
||||||
|
/// Stream data truncated
|
||||||
|
///
|
||||||
|
/// Emitted when a stream has less data than expected based on its declared
|
||||||
|
/// dimensions and color space. Partial data is used.
|
||||||
|
///
|
||||||
|
/// Phase origin: 1.5 / 5.2.1
|
||||||
|
StreamTruncated,
|
||||||
|
|
||||||
// === REMOTE_* codes ===
|
// === REMOTE_* codes ===
|
||||||
|
|
||||||
/// HTTP fetch interrupted or failed
|
/// HTTP fetch interrupted or failed
|
||||||
|
|
@ -721,6 +754,7 @@ impl DiagCode {
|
||||||
| DiagCode::StructIntegerOverflow
|
| DiagCode::StructIntegerOverflow
|
||||||
| DiagCode::StructInvalidObjstm
|
| DiagCode::StructInvalidObjstm
|
||||||
| DiagCode::StructInvalidGeometry
|
| DiagCode::StructInvalidGeometry
|
||||||
|
| DiagCode::StructInvalidType
|
||||||
| DiagCode::StructInvalidUtf16
|
| DiagCode::StructInvalidUtf16
|
||||||
| DiagCode::StructUnresolvedDestination
|
| DiagCode::StructUnresolvedDestination
|
||||||
| DiagCode::StructNonGotoOutline
|
| DiagCode::StructNonGotoOutline
|
||||||
|
|
@ -747,7 +781,8 @@ impl DiagCode {
|
||||||
DiagCode::StreamDecodeError
|
DiagCode::StreamDecodeError
|
||||||
| DiagCode::StreamBomb
|
| DiagCode::StreamBomb
|
||||||
| DiagCode::StreamUnknownFilter
|
| DiagCode::StreamUnknownFilter
|
||||||
| DiagCode::StreamInvalidParams => "STREAM",
|
| DiagCode::StreamInvalidParams
|
||||||
|
| DiagCode::StreamTruncated => "STREAM",
|
||||||
|
|
||||||
// ENCRYPTION_*
|
// ENCRYPTION_*
|
||||||
DiagCode::EncryptionUnsupported | DiagCode::EncryptionWrongPassword => "ENCRYPTION",
|
DiagCode::EncryptionUnsupported | DiagCode::EncryptionWrongPassword => "ENCRYPTION",
|
||||||
|
|
@ -772,6 +807,10 @@ impl DiagCode {
|
||||||
| DiagCode::OcrTesseractFailed
|
| DiagCode::OcrTesseractFailed
|
||||||
| DiagCode::OcrBrokenVectorUnavailable => "OCR",
|
| DiagCode::OcrBrokenVectorUnavailable => "OCR",
|
||||||
|
|
||||||
|
// IMG_*
|
||||||
|
DiagCode::ImgSoftmaskUnsupported
|
||||||
|
| DiagCode::ImgUnsupportedFormat => "IMG",
|
||||||
|
|
||||||
// REMOTE_*
|
// REMOTE_*
|
||||||
DiagCode::RemoteFetchInterrupted
|
DiagCode::RemoteFetchInterrupted
|
||||||
| DiagCode::RemoteNoRangeSupport
|
| DiagCode::RemoteNoRangeSupport
|
||||||
|
|
@ -817,6 +856,7 @@ impl DiagCode {
|
||||||
DiagCode::StructIntegerOverflow => "STRUCT_INTEGER_OVERFLOW",
|
DiagCode::StructIntegerOverflow => "STRUCT_INTEGER_OVERFLOW",
|
||||||
DiagCode::StructInvalidObjstm => "STRUCT_INVALID_OBJSTM",
|
DiagCode::StructInvalidObjstm => "STRUCT_INVALID_OBJSTM",
|
||||||
DiagCode::StructInvalidGeometry => "STRUCT_INVALID_GEOMETRY",
|
DiagCode::StructInvalidGeometry => "STRUCT_INVALID_GEOMETRY",
|
||||||
|
DiagCode::StructInvalidType => "STRUCT_INVALID_TYPE",
|
||||||
DiagCode::StructInvalidUtf16 => "STRUCT_INVALID_UTF16",
|
DiagCode::StructInvalidUtf16 => "STRUCT_INVALID_UTF16",
|
||||||
DiagCode::StructUnresolvedDestination => "STRUCT_UNRESOLVED_DESTINATION",
|
DiagCode::StructUnresolvedDestination => "STRUCT_UNRESOLVED_DESTINATION",
|
||||||
DiagCode::StructNonGotoOutline => "STRUCT_NON_GOTO_OUTLINE",
|
DiagCode::StructNonGotoOutline => "STRUCT_NON_GOTO_OUTLINE",
|
||||||
|
|
@ -854,6 +894,9 @@ impl DiagCode {
|
||||||
DiagCode::OcrCcittUnsupported => "OCR_CCITT_UNSUPPORTED",
|
DiagCode::OcrCcittUnsupported => "OCR_CCITT_UNSUPPORTED",
|
||||||
DiagCode::OcrTesseractFailed => "OCR_TESSERACT_FAILED",
|
DiagCode::OcrTesseractFailed => "OCR_TESSERACT_FAILED",
|
||||||
DiagCode::OcrBrokenVectorUnavailable => "OCR_BROKENVECTOR_UNAVAILABLE",
|
DiagCode::OcrBrokenVectorUnavailable => "OCR_BROKENVECTOR_UNAVAILABLE",
|
||||||
|
DiagCode::ImgSoftmaskUnsupported => "IMG_SOFTMASK_UNSUPPORTED",
|
||||||
|
DiagCode::ImgUnsupportedFormat => "IMG_UNSUPPORTED_FORMAT",
|
||||||
|
DiagCode::StreamTruncated => "STREAM_TRUNCATED",
|
||||||
DiagCode::RemoteFetchInterrupted => "REMOTE_FETCH_INTERRUPTED",
|
DiagCode::RemoteFetchInterrupted => "REMOTE_FETCH_INTERRUPTED",
|
||||||
DiagCode::RemoteNoRangeSupport => "REMOTE_NO_RANGE_SUPPORT",
|
DiagCode::RemoteNoRangeSupport => "REMOTE_NO_RANGE_SUPPORT",
|
||||||
DiagCode::RemoteTlsFailed => "REMOTE_TLS_FAILED",
|
DiagCode::RemoteTlsFailed => "REMOTE_TLS_FAILED",
|
||||||
|
|
@ -894,6 +937,7 @@ impl DiagCode {
|
||||||
| DiagCode::StructIntegerOverflow
|
| DiagCode::StructIntegerOverflow
|
||||||
| DiagCode::StructInvalidObjstm
|
| DiagCode::StructInvalidObjstm
|
||||||
| DiagCode::StructInvalidGeometry
|
| DiagCode::StructInvalidGeometry
|
||||||
|
| DiagCode::StructInvalidType
|
||||||
| DiagCode::StructInvalidUtf16
|
| DiagCode::StructInvalidUtf16
|
||||||
| DiagCode::StructUnresolvedDestination
|
| DiagCode::StructUnresolvedDestination
|
||||||
| DiagCode::StructNonGotoOutline
|
| DiagCode::StructNonGotoOutline
|
||||||
|
|
@ -926,6 +970,9 @@ impl DiagCode {
|
||||||
| DiagCode::OcrCcittUnsupported
|
| DiagCode::OcrCcittUnsupported
|
||||||
| DiagCode::OcrTesseractFailed
|
| DiagCode::OcrTesseractFailed
|
||||||
| DiagCode::OcrBrokenVectorUnavailable
|
| DiagCode::OcrBrokenVectorUnavailable
|
||||||
|
| DiagCode::ImgSoftmaskUnsupported
|
||||||
|
| DiagCode::ImgUnsupportedFormat
|
||||||
|
| DiagCode::StreamTruncated
|
||||||
| DiagCode::RemoteNoRangeSupport
|
| DiagCode::RemoteNoRangeSupport
|
||||||
| DiagCode::GstateStackOverflow
|
| DiagCode::GstateStackOverflow
|
||||||
| DiagCode::GstateStackUnderflow
|
| DiagCode::GstateStackUnderflow
|
||||||
|
|
@ -1403,6 +1450,31 @@ pub const DIAGNOSTIC_CATALOG: &[DiagInfo] = &[
|
||||||
phase: "4.7",
|
phase: "4.7",
|
||||||
suggested_action: "Build with --features ocr to enable OCR recovery on broken-vector pages",
|
suggested_action: "Build with --features ocr to enable OCR recovery on broken-vector pages",
|
||||||
},
|
},
|
||||||
|
// === IMG_* codes ===
|
||||||
|
DiagInfo {
|
||||||
|
code: DiagCode::ImgSoftmaskUnsupported,
|
||||||
|
category: "IMG",
|
||||||
|
severity: Severity::Warning,
|
||||||
|
recoverable: true,
|
||||||
|
phase: "5.2.1",
|
||||||
|
suggested_action: "Soft-masked images not supported in direct compositing; use --features full-render for proper rendering",
|
||||||
|
},
|
||||||
|
DiagInfo {
|
||||||
|
code: DiagCode::ImgUnsupportedFormat,
|
||||||
|
category: "IMG",
|
||||||
|
severity: Severity::Warning,
|
||||||
|
recoverable: true,
|
||||||
|
phase: "5.2.1",
|
||||||
|
suggested_action: "Image format or bits-per-component not supported; image is skipped",
|
||||||
|
},
|
||||||
|
DiagInfo {
|
||||||
|
code: DiagCode::StreamTruncated,
|
||||||
|
category: "STREAM",
|
||||||
|
severity: Severity::Warning,
|
||||||
|
recoverable: true,
|
||||||
|
phase: "1.5 / 5.2.1",
|
||||||
|
suggested_action: "Stream has less data than expected; partial data is used",
|
||||||
|
},
|
||||||
// === REMOTE_* codes ===
|
// === REMOTE_* codes ===
|
||||||
DiagInfo {
|
DiagInfo {
|
||||||
code: DiagCode::RemoteFetchInterrupted,
|
code: DiagCode::RemoteFetchInterrupted,
|
||||||
|
|
|
||||||
333
crates/pdftract-core/src/graphics_state.rs
Normal file
333
crates/pdftract-core/src/graphics_state.rs
Normal file
|
|
@ -0,0 +1,333 @@
|
||||||
|
//! Graphics state management for PDF content stream processing.
|
||||||
|
//!
|
||||||
|
//! This module implements the graphics state stack and CTM (Current Transformation Matrix)
|
||||||
|
//! tracking needed for Phase 3 content stream processing and Phase 5.2.1 image compositing.
|
||||||
|
//!
|
||||||
|
//! Per PDF spec section 8.4 "Graphics State":
|
||||||
|
//! - q operator pushes a copy of the current graphics state onto the stack
|
||||||
|
//! - Q operator pops the graphics state stack and restores the state
|
||||||
|
//! - cm operator concatenates a matrix with the CTM
|
||||||
|
//!
|
||||||
|
//! The CTM is a 3x3 transformation matrix that transforms coordinates from user space
|
||||||
|
//! to device space. For 2D operations, only 6 values are relevant: [a b c d e f]
|
||||||
|
//! representing the affine transformation:
|
||||||
|
//! x' = a*x + c*y + e
|
||||||
|
//! y' = b*x + d*y + f
|
||||||
|
|
||||||
|
use crate::diagnostics::{Diagnostic, DiagCode};
|
||||||
|
|
||||||
|
/// Maximum depth of graphics state stack (prevents stack overflow).
|
||||||
|
const MAX_GSTATE_DEPTH: usize = 32;
|
||||||
|
|
||||||
|
/// 3x3 transformation matrix for PDF coordinate transformations.
|
||||||
|
///
|
||||||
|
/// Only the first 6 values are used for 2D affine transformations:
|
||||||
|
/// [a b 0]
|
||||||
|
/// [c d 0]
|
||||||
|
/// [e f 1]
|
||||||
|
///
|
||||||
|
/// Per PDF spec, the CTM transforms from user space to device space.
|
||||||
|
#[derive(Debug, Clone, Copy, PartialEq)]
|
||||||
|
pub struct Matrix3x3 {
|
||||||
|
/// The a coefficient (x scale)
|
||||||
|
pub a: f64,
|
||||||
|
/// The b coefficient (y skew)
|
||||||
|
pub b: f64,
|
||||||
|
/// The c coefficient (x skew)
|
||||||
|
pub c: f64,
|
||||||
|
/// The d coefficient (y scale)
|
||||||
|
pub d: f64,
|
||||||
|
/// The e coefficient (x translation)
|
||||||
|
pub e: f64,
|
||||||
|
/// The f coefficient (y translation)
|
||||||
|
pub f: f64,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Matrix3x3 {
|
||||||
|
/// Create a new identity matrix.
|
||||||
|
#[inline]
|
||||||
|
pub fn identity() -> Self {
|
||||||
|
Self {
|
||||||
|
a: 1.0,
|
||||||
|
b: 0.0,
|
||||||
|
c: 0.0,
|
||||||
|
d: 1.0,
|
||||||
|
e: 0.0,
|
||||||
|
f: 0.0,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Create a matrix from a PDF-style 6-element array [a b c d e f].
|
||||||
|
#[inline]
|
||||||
|
pub fn from_pdf_array(arr: [f64; 6]) -> Self {
|
||||||
|
Self {
|
||||||
|
a: arr[0],
|
||||||
|
b: arr[1],
|
||||||
|
c: arr[2],
|
||||||
|
d: arr[3],
|
||||||
|
e: arr[4],
|
||||||
|
f: arr[5],
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Check if this is the identity matrix.
|
||||||
|
#[inline]
|
||||||
|
pub fn is_identity(&self) -> bool {
|
||||||
|
self.a == 1.0 && self.b == 0.0 && self.c == 0.0 &&
|
||||||
|
self.d == 1.0 && self.e == 0.0 && self.f == 0.0
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Multiply this matrix by another (this * other).
|
||||||
|
#[inline]
|
||||||
|
pub fn multiply(&self, other: &Matrix3x3) -> Matrix3x3 {
|
||||||
|
Matrix3x3 {
|
||||||
|
a: self.a * other.a + self.b * other.c,
|
||||||
|
b: self.a * other.b + self.b * other.d,
|
||||||
|
c: self.c * other.a + self.d * other.c,
|
||||||
|
d: self.c * other.b + self.d * other.d,
|
||||||
|
e: self.e * other.a + self.f * other.c + other.e,
|
||||||
|
f: self.e * other.b + self.f * other.d + other.f,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Transform a point (x, y) by this matrix.
|
||||||
|
#[inline]
|
||||||
|
pub fn transform_point(&self, x: f64, y: f64) -> (f64, f64) {
|
||||||
|
let new_x = self.a * x + self.c * y + self.e;
|
||||||
|
let new_y = self.b * x + self.d * y + self.f;
|
||||||
|
(new_x, new_y)
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Get the determinant of this matrix.
|
||||||
|
#[inline]
|
||||||
|
pub fn determinant(&self) -> f64 {
|
||||||
|
self.a * self.d - self.b * self.c
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Check if the matrix has a negative determinant (flip).
|
||||||
|
#[inline]
|
||||||
|
pub fn has_flip(&self) -> bool {
|
||||||
|
self.determinant() < 0.0
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Default for Matrix3x3 {
|
||||||
|
fn default() -> Self {
|
||||||
|
Self::identity()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Graphics state as defined in PDF spec section 8.4.
|
||||||
|
///
|
||||||
|
/// This contains the CTM and other graphics state parameters.
|
||||||
|
/// For Phase 5.2.1 image compositing, we only need the CTM.
|
||||||
|
#[derive(Debug, Clone)]
|
||||||
|
pub struct GraphicsState {
|
||||||
|
/// Current Transformation Matrix
|
||||||
|
pub ctm: Matrix3x3,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl GraphicsState {
|
||||||
|
/// Create a new graphics state with identity CTM.
|
||||||
|
#[inline]
|
||||||
|
pub fn new() -> Self {
|
||||||
|
Self {
|
||||||
|
ctm: Matrix3x3::identity(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Concatenate a matrix with the current CTM.
|
||||||
|
///
|
||||||
|
/// This implements the `cm` operator behavior: CTM' = CTM × M
|
||||||
|
#[inline]
|
||||||
|
pub fn concat_ctm(&mut self, matrix: &Matrix3x3) {
|
||||||
|
self.ctm = self.ctm.multiply(matrix);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Default for GraphicsState {
|
||||||
|
fn default() -> Self {
|
||||||
|
Self::new()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Graphics state stack for q/Q operators.
|
||||||
|
///
|
||||||
|
/// Per PDF spec, the graphics state stack has a maximum depth to prevent
|
||||||
|
/// stack overflow in malformed PDFs.
|
||||||
|
#[derive(Debug, Clone)]
|
||||||
|
pub struct GraphicsStateStack {
|
||||||
|
/// The stack of saved graphics states
|
||||||
|
stack: Vec<GraphicsState>,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl GraphicsStateStack {
|
||||||
|
/// Create a new empty graphics state stack.
|
||||||
|
#[inline]
|
||||||
|
pub fn new() -> Self {
|
||||||
|
Self {
|
||||||
|
stack: Vec::with_capacity(16),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Push a graphics state onto the stack (implements `q` operator).
|
||||||
|
///
|
||||||
|
/// Returns false if the stack would exceed the maximum depth.
|
||||||
|
#[inline]
|
||||||
|
pub fn push(&mut self, state: &GraphicsState) -> bool {
|
||||||
|
if self.stack.len() >= MAX_GSTATE_DEPTH {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
self.stack.push(state.clone());
|
||||||
|
true
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Pop a graphics state from the stack (implements `Q` operator).
|
||||||
|
///
|
||||||
|
/// Returns None if the stack is empty.
|
||||||
|
#[inline]
|
||||||
|
pub fn pop(&mut self) -> Option<GraphicsState> {
|
||||||
|
self.stack.pop()
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Get the current depth of the stack.
|
||||||
|
#[inline]
|
||||||
|
pub fn depth(&self) -> usize {
|
||||||
|
self.stack.len()
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Check if the stack is empty.
|
||||||
|
#[inline]
|
||||||
|
pub fn is_empty(&self) -> bool {
|
||||||
|
self.stack.is_empty()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Default for GraphicsStateStack {
|
||||||
|
fn default() -> Self {
|
||||||
|
Self::new()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[cfg(test)]
|
||||||
|
mod tests {
|
||||||
|
use super::*;
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_identity_matrix() {
|
||||||
|
let m = Matrix3x3::identity();
|
||||||
|
assert!(m.is_identity());
|
||||||
|
assert_eq!(m.transform_point(1.0, 0.0), (1.0, 0.0));
|
||||||
|
assert_eq!(m.transform_point(0.0, 1.0), (0.0, 1.0));
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_translation_matrix() {
|
||||||
|
let m = Matrix3x3::from_pdf_array([1.0, 0.0, 0.0, 1.0, 10.0, 20.0]);
|
||||||
|
let (x, y) = m.transform_point(0.0, 0.0);
|
||||||
|
assert_eq!(x, 10.0);
|
||||||
|
assert_eq!(y, 20.0);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_scale_matrix() {
|
||||||
|
let m = Matrix3x3::from_pdf_array([2.0, 0.0, 0.0, 3.0, 0.0, 0.0]);
|
||||||
|
let (x, y) = m.transform_point(1.0, 1.0);
|
||||||
|
assert_eq!(x, 2.0);
|
||||||
|
assert_eq!(y, 3.0);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_matrix_multiply() {
|
||||||
|
let m1 = Matrix3x3::from_pdf_array([2.0, 0.0, 0.0, 1.0, 0.0, 0.0]);
|
||||||
|
let m2 = Matrix3x3::from_pdf_array([1.0, 0.0, 0.0, 3.0, 0.0, 0.0]);
|
||||||
|
let result = m1.multiply(&m2);
|
||||||
|
|
||||||
|
// Should scale x by 2, y by 3
|
||||||
|
let (x, y) = result.transform_point(1.0, 1.0);
|
||||||
|
assert_eq!(x, 2.0);
|
||||||
|
assert_eq!(y, 3.0);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_determinant_positive() {
|
||||||
|
let m = Matrix3x3::identity();
|
||||||
|
assert_eq!(m.determinant(), 1.0);
|
||||||
|
assert!(!m.has_flip());
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_determinant_negative() {
|
||||||
|
// Y flip matrix
|
||||||
|
let m = Matrix3x3::from_pdf_array([1.0, 0.0, 0.0, -1.0, 0.0, 0.0]);
|
||||||
|
assert_eq!(m.determinant(), -1.0);
|
||||||
|
assert!(m.has_flip());
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_gstate_stack_push_pop() {
|
||||||
|
let mut stack = GraphicsStateStack::new();
|
||||||
|
let state1 = GraphicsState::new();
|
||||||
|
|
||||||
|
assert!(stack.is_empty());
|
||||||
|
assert_eq!(stack.depth(), 0);
|
||||||
|
|
||||||
|
assert!(stack.push(&state1));
|
||||||
|
assert_eq!(stack.depth(), 1);
|
||||||
|
assert!(!stack.is_empty());
|
||||||
|
|
||||||
|
let popped = stack.pop();
|
||||||
|
assert!(popped.is_some());
|
||||||
|
assert!(stack.is_empty());
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_gstate_stack_depth_limit() {
|
||||||
|
let mut stack = GraphicsStateStack::new();
|
||||||
|
let state = GraphicsState::new();
|
||||||
|
|
||||||
|
// Fill to max depth
|
||||||
|
for _ in 0..MAX_GSTATE_DEPTH {
|
||||||
|
assert!(stack.push(&state));
|
||||||
|
}
|
||||||
|
|
||||||
|
// Should fail to push beyond max
|
||||||
|
assert!(!stack.push(&state));
|
||||||
|
assert_eq!(stack.depth(), MAX_GSTATE_DEPTH);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_gstate_ctm_concat() {
|
||||||
|
let mut state = GraphicsState::new();
|
||||||
|
let translate = Matrix3x3::from_pdf_array([1.0, 0.0, 0.0, 1.0, 10.0, 20.0]);
|
||||||
|
state.concat_ctm(&translate);
|
||||||
|
|
||||||
|
let (x, y) = state.ctm.transform_point(0.0, 0.0);
|
||||||
|
assert_eq!(x, 10.0);
|
||||||
|
assert_eq!(y, 20.0);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_gstate_stack_restore() {
|
||||||
|
let mut stack = GraphicsStateStack::new();
|
||||||
|
let mut state1 = GraphicsState::new();
|
||||||
|
let mut state2 = GraphicsState::new();
|
||||||
|
|
||||||
|
// Modify state1
|
||||||
|
let translate = Matrix3x3::from_pdf_array([1.0, 0.0, 0.0, 1.0, 10.0, 20.0]);
|
||||||
|
state1.concat_ctm(&translate);
|
||||||
|
|
||||||
|
// Push state1
|
||||||
|
stack.push(&state1);
|
||||||
|
|
||||||
|
// Modify state2
|
||||||
|
let scale = Matrix3x3::from_pdf_array([2.0, 0.0, 0.0, 2.0, 0.0, 0.0]);
|
||||||
|
state2.concat_ctm(&scale);
|
||||||
|
|
||||||
|
// Pop should restore state1
|
||||||
|
let restored = stack.pop().unwrap();
|
||||||
|
let (x, y) = restored.ctm.transform_point(0.0, 0.0);
|
||||||
|
assert_eq!(x, 10.0);
|
||||||
|
assert_eq!(y, 20.0);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
@ -11,9 +11,12 @@ pub mod document;
|
||||||
pub mod extract;
|
pub mod extract;
|
||||||
pub mod fingerprint;
|
pub mod fingerprint;
|
||||||
pub mod font;
|
pub mod font;
|
||||||
|
pub mod graphics_state;
|
||||||
pub mod options;
|
pub mod options;
|
||||||
pub mod parser;
|
pub mod parser;
|
||||||
pub mod receipts;
|
pub mod receipts;
|
||||||
|
#[cfg(feature = "ocr")]
|
||||||
|
pub mod render;
|
||||||
pub mod schema;
|
pub mod schema;
|
||||||
pub mod semaphore;
|
pub mod semaphore;
|
||||||
|
|
||||||
|
|
|
||||||
950
crates/pdftract-core/src/render.rs
Normal file
950
crates/pdftract-core/src/render.rs
Normal file
|
|
@ -0,0 +1,950 @@
|
||||||
|
//! Direct image compositing for scanned pages (Phase 5.2.1).
|
||||||
|
//!
|
||||||
|
//! This module implements the default-feature image rendering path that:
|
||||||
|
//! 1. Walks the content stream operator list
|
||||||
|
//! 2. Builds CTM stack (q/Q + cm operators)
|
||||||
|
//! 3. Collects image XObject references (Do operator) with their CTMs
|
||||||
|
//! 4. Retrieves each image XObject via Phase 1.5 stream decoder
|
||||||
|
//! 5. Converts to GrayImage (luminance conversion from RGB if needed)
|
||||||
|
//! 6. Computes pixel placement using CTM
|
||||||
|
//! 7. Composites each placed image onto a white-background canvas
|
||||||
|
//!
|
||||||
|
//! This path has zero external dependencies (uses image crate from default deps)
|
||||||
|
//! and handles > 90% of scanned PDFs correctly.
|
||||||
|
//!
|
||||||
|
//! # Feature Gate
|
||||||
|
//!
|
||||||
|
//! This module is only available when the `ocr` feature is enabled.
|
||||||
|
#![cfg(feature = "ocr")]
|
||||||
|
|
||||||
|
use crate::graphics_state::{Matrix3x3, GraphicsStateStack, GraphicsState};
|
||||||
|
use crate::parser::lexer::Lexer;
|
||||||
|
use crate::parser::lexer::Token;
|
||||||
|
use crate::parser::object::{PdfObject, ObjRef};
|
||||||
|
use crate::parser::xref::XrefResolver;
|
||||||
|
use crate::parser::stream::{decode_stream, ExtractionOptions as StreamExtractionOptions, PdfSource};
|
||||||
|
use crate::parser::resources::ResourceDict;
|
||||||
|
use crate::diagnostics::{Diagnostic, DiagCode};
|
||||||
|
use image::{GrayImage, RgbImage, RgbaImage, Luma, Rgb, Rgba, ImageBuffer, DynamicImage};
|
||||||
|
use std::sync::Arc;
|
||||||
|
|
||||||
|
/// Maximum number of images to composite per page (prevents DoS).
|
||||||
|
const MAX_IMAGES_PER_PAGE: usize = 256;
|
||||||
|
|
||||||
|
/// Result type for image compositing operations.
|
||||||
|
pub type Result<T> = std::result::Result<T, Vec<Diagnostic>>;
|
||||||
|
|
||||||
|
/// An image placement instruction from a Do operator.
|
||||||
|
///
|
||||||
|
/// Contains the XObject reference and the CTM at the time of the Do.
|
||||||
|
#[derive(Debug, Clone)]
|
||||||
|
pub struct ImagePlacement {
|
||||||
|
/// The XObject reference (must be an Image XObject, not a Form).
|
||||||
|
pub xobject_ref: ObjRef,
|
||||||
|
/// The CTM at the time of the Do operator.
|
||||||
|
pub ctm: Matrix3x3,
|
||||||
|
/// The XObject name (for diagnostics).
|
||||||
|
pub name: Arc<str>,
|
||||||
|
}
|
||||||
|
|
||||||
|
/// An inline image from a BI/ID/EI sequence.
|
||||||
|
///
|
||||||
|
/// Inline images are embedded directly in the content stream rather than
|
||||||
|
/// being referenced as XObjects.
|
||||||
|
#[derive(Debug, Clone)]
|
||||||
|
pub struct InlineImage {
|
||||||
|
/// The image data (decoded).
|
||||||
|
pub data: Vec<u8>,
|
||||||
|
/// Image width in pixels.
|
||||||
|
pub width: u32,
|
||||||
|
/// Image height in pixels.
|
||||||
|
pub height: u32,
|
||||||
|
/// Bits per component.
|
||||||
|
pub bpc: u8,
|
||||||
|
/// Color space: "DeviceGray", "DeviceRGB", or "DeviceCMYK".
|
||||||
|
pub colorspace: String,
|
||||||
|
/// Filter applied to the image data.
|
||||||
|
pub filter: Option<String>,
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Represents either an XObject image or an inline image.
|
||||||
|
#[derive(Debug, Clone)]
|
||||||
|
pub enum ImageSource {
|
||||||
|
/// An XObject reference (most common).
|
||||||
|
XObject(ObjRef, Arc<str>),
|
||||||
|
/// An inline image (BI/ID/EI sequence).
|
||||||
|
Inline(InlineImage),
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Walk content stream and collect image placements with their CTMs.
|
||||||
|
///
|
||||||
|
/// This function:
|
||||||
|
/// 1. Parses the content stream into tokens
|
||||||
|
/// 2. Maintains a CTM stack (q/Q operators)
|
||||||
|
/// 3. Tracks cm operators (concatenate matrix)
|
||||||
|
/// 4. Collects Do operators with their current CTM
|
||||||
|
/// 5. Collects inline images (BI/ID/EI sequences)
|
||||||
|
///
|
||||||
|
/// # Arguments
|
||||||
|
///
|
||||||
|
/// * `content` - The decoded content stream bytes
|
||||||
|
/// * `resources` - The page's resource dictionary (for XObject lookup)
|
||||||
|
///
|
||||||
|
/// # Returns
|
||||||
|
///
|
||||||
|
/// A list of image placements with their CTMs, or diagnostics if parsing fails.
|
||||||
|
pub fn collect_image_placements(
|
||||||
|
content: &[u8],
|
||||||
|
resources: &ResourceDict,
|
||||||
|
) -> Result<Vec<ImagePlacement>> {
|
||||||
|
let mut placements = Vec::new();
|
||||||
|
let mut diagnostics = Vec::new();
|
||||||
|
|
||||||
|
// Create graphics state stack
|
||||||
|
let mut gss = GraphicsStateStack::new();
|
||||||
|
let mut state = GraphicsState::new();
|
||||||
|
|
||||||
|
// Tokenize content stream
|
||||||
|
let mut lexer = Lexer::new(content);
|
||||||
|
let mut operand_buffer: Vec<Token> = Vec::new();
|
||||||
|
|
||||||
|
while let Some(token) = lexer.next_token() {
|
||||||
|
match token {
|
||||||
|
Token::Keyword(ref k) => {
|
||||||
|
let keyword = std::str::from_utf8(k).unwrap_or("");
|
||||||
|
|
||||||
|
match keyword {
|
||||||
|
"q" => {
|
||||||
|
// Push graphics state
|
||||||
|
if !gss.push(&state) {
|
||||||
|
diagnostics.push(Diagnostic::with_static_no_offset(
|
||||||
|
DiagCode::GstateStackOverflow,
|
||||||
|
"Graphics state stack overflow",
|
||||||
|
));
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
operand_buffer.clear();
|
||||||
|
}
|
||||||
|
"Q" => {
|
||||||
|
// Pop graphics state
|
||||||
|
if let Some(popped) = gss.pop() {
|
||||||
|
state = popped;
|
||||||
|
}
|
||||||
|
operand_buffer.clear();
|
||||||
|
}
|
||||||
|
"cm" => {
|
||||||
|
// Concatenate matrix: cm expects 6 numbers
|
||||||
|
let nums: Vec<f64> = operand_buffer.iter().filter_map(|t| {
|
||||||
|
match t {
|
||||||
|
Token::Integer(n) => Some(*n as f64),
|
||||||
|
Token::Real(f) => Some(*f),
|
||||||
|
_ => None,
|
||||||
|
}
|
||||||
|
}).collect();
|
||||||
|
|
||||||
|
if nums.len() >= 6 {
|
||||||
|
let matrix = Matrix3x3::from_pdf_array([nums[0], nums[1], nums[2], nums[3], nums[4], nums[5]]);
|
||||||
|
state.concat_ctm(&matrix);
|
||||||
|
}
|
||||||
|
operand_buffer.clear();
|
||||||
|
}
|
||||||
|
"Do" => {
|
||||||
|
// Paint XObject: Do expects a name operand
|
||||||
|
if let Some(name_token) = operand_buffer.last() {
|
||||||
|
if let Token::Name(name_bytes) = name_token {
|
||||||
|
if let Ok(name_str) = std::str::from_utf8(name_bytes) {
|
||||||
|
let name_key = name_str.trim_start_matches('/');
|
||||||
|
// Check if this XObject exists in resources
|
||||||
|
if let Some(&xobject_ref) = resources.xobjects.get(name_key) {
|
||||||
|
// Record the placement with current CTM
|
||||||
|
placements.push(ImagePlacement {
|
||||||
|
xobject_ref,
|
||||||
|
ctm: state.ctm,
|
||||||
|
name: Arc::from(name_key),
|
||||||
|
});
|
||||||
|
|
||||||
|
// Check image count limit
|
||||||
|
if placements.len() >= MAX_IMAGES_PER_PAGE {
|
||||||
|
diagnostics.push(Diagnostic::with_dynamic_no_offset(
|
||||||
|
DiagCode::StreamBomb,
|
||||||
|
format!("Too many images on page ({}), aborting", MAX_IMAGES_PER_PAGE),
|
||||||
|
));
|
||||||
|
return Err(diagnostics);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
operand_buffer.clear();
|
||||||
|
}
|
||||||
|
"BI" => {
|
||||||
|
// Begin inline image - this is complex to handle in the token stream
|
||||||
|
// For now, we'll skip inline images silently
|
||||||
|
// Full inline image support requires a more sophisticated parser
|
||||||
|
// that can handle the BI/ID/EI sequence properly
|
||||||
|
operand_buffer.clear();
|
||||||
|
}
|
||||||
|
_ => {
|
||||||
|
// Other operator - clear operands
|
||||||
|
operand_buffer.clear();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
Token::Integer(_) | Token::Real(_) | Token::Name(_) => {
|
||||||
|
// Collect operands for cm and Do operators
|
||||||
|
operand_buffer.push(token);
|
||||||
|
}
|
||||||
|
_ => {
|
||||||
|
// Other tokens - ignore
|
||||||
|
operand_buffer.clear();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if diagnostics.is_empty() || !placements.is_empty() {
|
||||||
|
Ok(placements)
|
||||||
|
} else {
|
||||||
|
Err(diagnostics)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Get the /Matrix from an XObject dictionary if present.
|
||||||
|
///
|
||||||
|
/// Returns the matrix if found, or identity if not present.
|
||||||
|
fn get_xobject_matrix(
|
||||||
|
xobject_ref: ObjRef,
|
||||||
|
resolver: &XrefResolver,
|
||||||
|
) -> Matrix3x3 {
|
||||||
|
// Resolve the XObject
|
||||||
|
let xobject = match resolver.resolve(xobject_ref) {
|
||||||
|
Ok(obj) => obj,
|
||||||
|
Err(_) => return Matrix3x3::identity(),
|
||||||
|
};
|
||||||
|
|
||||||
|
// Get the stream
|
||||||
|
let stream = match xobject.as_stream() {
|
||||||
|
Some(s) => s,
|
||||||
|
None => return Matrix3x3::identity(),
|
||||||
|
};
|
||||||
|
|
||||||
|
// Get the /Matrix key if present
|
||||||
|
let dict = &stream.dict;
|
||||||
|
match dict.get("/Matrix") {
|
||||||
|
Some(PdfObject::Array(arr)) => {
|
||||||
|
// Matrix should be a 6-element array
|
||||||
|
let nums: Vec<f64> = arr.iter().filter_map(|v| {
|
||||||
|
match v {
|
||||||
|
PdfObject::Integer(n) => Some(*n as f64),
|
||||||
|
PdfObject::Real(f) => Some(*f),
|
||||||
|
_ => None,
|
||||||
|
}
|
||||||
|
}).collect();
|
||||||
|
|
||||||
|
if nums.len() >= 6 {
|
||||||
|
Matrix3x3::from_pdf_array([nums[0], nums[1], nums[2], nums[3], nums[4], nums[5]])
|
||||||
|
} else {
|
||||||
|
Matrix3x3::identity()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
_ => Matrix3x3::identity(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Decode an image XObject to a DynamicImage.
|
||||||
|
///
|
||||||
|
/// Handles various image formats:
|
||||||
|
/// - DCTDecode (JPEG)
|
||||||
|
/// - JPXDecode (JPEG2000)
|
||||||
|
/// - FlateDecode/LZWDecode (raw RGB/grayscale)
|
||||||
|
///
|
||||||
|
/// # Arguments
|
||||||
|
///
|
||||||
|
/// * `xobject_ref` - The image XObject reference
|
||||||
|
/// * `resolver` - The xref resolver
|
||||||
|
/// * `source` - The PDF source
|
||||||
|
/// * `max_bytes` - Maximum decompressed bytes
|
||||||
|
///
|
||||||
|
/// # Returns
|
||||||
|
///
|
||||||
|
/// The decoded image, or diagnostics if decoding fails.
|
||||||
|
pub fn decode_image_xobject(
|
||||||
|
xobject_ref: ObjRef,
|
||||||
|
resolver: &XrefResolver,
|
||||||
|
source: &dyn PdfSource,
|
||||||
|
max_bytes: u64,
|
||||||
|
) -> Result<DynamicImage> {
|
||||||
|
let mut diagnostics = Vec::new();
|
||||||
|
|
||||||
|
// Resolve the XObject
|
||||||
|
let xobject = match resolver.resolve(xobject_ref) {
|
||||||
|
Ok(obj) => obj,
|
||||||
|
Err(e) => {
|
||||||
|
diagnostics.push(Diagnostic::with_dynamic_no_offset(
|
||||||
|
DiagCode::StructMissingKey,
|
||||||
|
format!("Failed to resolve XObject: {:?}", e),
|
||||||
|
));
|
||||||
|
return Err(diagnostics);
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
// Get the stream
|
||||||
|
let stream = match xobject.as_stream() {
|
||||||
|
Some(s) => s,
|
||||||
|
None => {
|
||||||
|
diagnostics.push(Diagnostic::with_static_no_offset(
|
||||||
|
DiagCode::StructInvalidType,
|
||||||
|
"XObject is not a stream",
|
||||||
|
));
|
||||||
|
return Err(diagnostics);
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
// Get the XObject subtype
|
||||||
|
let dict = &stream.dict;
|
||||||
|
let _subtype = match dict.get("/Subtype") {
|
||||||
|
Some(PdfObject::Name(s)) if s.as_ref() == "Image" => s,
|
||||||
|
Some(_) => {
|
||||||
|
diagnostics.push(Diagnostic::with_static_no_offset(
|
||||||
|
DiagCode::StructInvalidType,
|
||||||
|
"XObject is not an Image",
|
||||||
|
));
|
||||||
|
return Err(diagnostics);
|
||||||
|
}
|
||||||
|
None => {
|
||||||
|
diagnostics.push(Diagnostic::with_static_no_offset(
|
||||||
|
DiagCode::StructMissingKey,
|
||||||
|
"XObject missing /Subtype",
|
||||||
|
));
|
||||||
|
return Err(diagnostics);
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
// Check for soft mask (not supported in direct compositing)
|
||||||
|
if let Some(_) = dict.get("/SMask") {
|
||||||
|
diagnostics.push(Diagnostic::with_static_no_offset(
|
||||||
|
DiagCode::ImgSoftmaskUnsupported,
|
||||||
|
"Soft-masked images not supported in direct compositing path",
|
||||||
|
));
|
||||||
|
return Err(diagnostics);
|
||||||
|
}
|
||||||
|
|
||||||
|
// Decode the stream
|
||||||
|
let stream_opts = StreamExtractionOptions {
|
||||||
|
max_decompress_bytes: max_bytes,
|
||||||
|
password: None,
|
||||||
|
};
|
||||||
|
let mut doc_counter = 0u64;
|
||||||
|
let decoded = decode_stream(stream, source, &stream_opts, &mut doc_counter);
|
||||||
|
|
||||||
|
// Get image dimensions
|
||||||
|
let width = match dict.get("/Width") {
|
||||||
|
Some(PdfObject::Integer(w)) => *w as u32,
|
||||||
|
Some(PdfObject::Real(w)) => *w as u32,
|
||||||
|
_ => {
|
||||||
|
diagnostics.push(Diagnostic::with_static_no_offset(
|
||||||
|
DiagCode::StructMissingKey,
|
||||||
|
"Image missing /Width",
|
||||||
|
));
|
||||||
|
return Err(diagnostics);
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
let height = match dict.get("/Height") {
|
||||||
|
Some(PdfObject::Integer(h)) => *h as u32,
|
||||||
|
Some(PdfObject::Real(h)) => *h as u32,
|
||||||
|
_ => {
|
||||||
|
diagnostics.push(Diagnostic::with_static_no_offset(
|
||||||
|
DiagCode::StructMissingKey,
|
||||||
|
"Image missing /Height",
|
||||||
|
));
|
||||||
|
return Err(diagnostics);
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
// Get color space
|
||||||
|
let colorspace = dict.get("/ColorSpace");
|
||||||
|
|
||||||
|
// Get bits per component
|
||||||
|
let bpc = match dict.get("/BitsPerComponent") {
|
||||||
|
Some(PdfObject::Integer(b)) => *b as u8,
|
||||||
|
_ => 8,
|
||||||
|
};
|
||||||
|
|
||||||
|
// Try to load as image based on filter
|
||||||
|
let filter = stream.filter();
|
||||||
|
|
||||||
|
// For JPEG images, try direct loading
|
||||||
|
if let Some(filters) = filter {
|
||||||
|
if filters.iter().any(|f| f == "DCTDecode" || f == "DCT") {
|
||||||
|
// Try to load as JPEG
|
||||||
|
match image::load_from_memory(&decoded) {
|
||||||
|
Ok(img) => return Ok(img),
|
||||||
|
Err(_) => {
|
||||||
|
// Fall through to manual decoding
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Manual decoding for non-JPEG images
|
||||||
|
// Determine color space
|
||||||
|
let is_rgb = match colorspace {
|
||||||
|
Some(PdfObject::Name(cs)) => cs.as_ref() == "DeviceRGB",
|
||||||
|
Some(PdfObject::Array(arr)) => {
|
||||||
|
if let Some(PdfObject::Name(cs)) = arr.first() {
|
||||||
|
cs.as_ref() == "DeviceRGB" || cs.as_ref() == "ICCBased" || cs.as_ref() == "CalRGB"
|
||||||
|
} else {
|
||||||
|
false
|
||||||
|
}
|
||||||
|
}
|
||||||
|
_ => false,
|
||||||
|
};
|
||||||
|
|
||||||
|
let is_cmyk = match colorspace {
|
||||||
|
Some(PdfObject::Name(cs)) => cs.as_ref() == "DeviceCMYK",
|
||||||
|
Some(PdfObject::Array(arr)) => {
|
||||||
|
if let Some(PdfObject::Name(cs)) = arr.first() {
|
||||||
|
cs.as_ref() == "DeviceCMYK"
|
||||||
|
} else {
|
||||||
|
false
|
||||||
|
}
|
||||||
|
}
|
||||||
|
_ => false,
|
||||||
|
};
|
||||||
|
|
||||||
|
// Calculate expected data size
|
||||||
|
let components = if is_rgb { 3 } else if is_cmyk { 4 } else { 1 };
|
||||||
|
let expected_size = (width as usize) * (height as usize) * (components as usize);
|
||||||
|
|
||||||
|
if decoded.len() < expected_size {
|
||||||
|
diagnostics.push(Diagnostic::with_dynamic_no_offset(
|
||||||
|
DiagCode::StreamTruncated,
|
||||||
|
format!("Image data truncated: expected {} bytes, got {}", expected_size, decoded.len()),
|
||||||
|
));
|
||||||
|
return Err(diagnostics);
|
||||||
|
}
|
||||||
|
|
||||||
|
// Create image from decoded data
|
||||||
|
let dynamic_img = if is_rgb {
|
||||||
|
// RGB image
|
||||||
|
if bpc == 8 {
|
||||||
|
let mut rgb_data = Vec::with_capacity(expected_size);
|
||||||
|
for i in (0..expected_size).step_by(3) {
|
||||||
|
if i + 2 < decoded.len() {
|
||||||
|
rgb_data.push(decoded[i]);
|
||||||
|
rgb_data.push(decoded[i + 1]);
|
||||||
|
rgb_data.push(decoded[i + 2]);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
let img: RgbImage = ImageBuffer::from_raw(width, height, rgb_data)
|
||||||
|
.unwrap_or_else(|| ImageBuffer::new(width, height));
|
||||||
|
DynamicImage::ImageRgb8(img)
|
||||||
|
} else {
|
||||||
|
// Unsupported bits per component
|
||||||
|
diagnostics.push(Diagnostic::with_static_no_offset(
|
||||||
|
DiagCode::ImgUnsupportedFormat,
|
||||||
|
"Unsupported bits per component for RGB image",
|
||||||
|
));
|
||||||
|
return Err(diagnostics);
|
||||||
|
}
|
||||||
|
} else if is_cmyk {
|
||||||
|
// CMYK image - need to convert to RGB
|
||||||
|
// This is a simplified conversion (proper conversion requires ICC profiles)
|
||||||
|
let mut rgb_data = Vec::with_capacity((width as usize) * (height as usize) * 3);
|
||||||
|
for i in (0..decoded.len()).step_by(4) {
|
||||||
|
if i + 3 < decoded.len() {
|
||||||
|
let c = decoded[i] as f32 / 255.0;
|
||||||
|
let m = decoded[i + 1] as f32 / 255.0;
|
||||||
|
let y = decoded[i + 2] as f32 / 255.0;
|
||||||
|
let k = decoded[i + 3] as f32 / 255.0;
|
||||||
|
|
||||||
|
// CMYK to RGB conversion
|
||||||
|
let r = ((1.0 - c) * (1.0 - k) * 255.0) as u8;
|
||||||
|
let g = ((1.0 - m) * (1.0 - k) * 255.0) as u8;
|
||||||
|
let b = ((1.0 - y) * (1.0 - k) * 255.0) as u8;
|
||||||
|
|
||||||
|
rgb_data.push(r);
|
||||||
|
rgb_data.push(g);
|
||||||
|
rgb_data.push(b);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
let img: RgbImage = ImageBuffer::from_raw(width, height, rgb_data)
|
||||||
|
.unwrap_or_else(|| ImageBuffer::new(width, height));
|
||||||
|
DynamicImage::ImageRgb8(img)
|
||||||
|
} else {
|
||||||
|
// Grayscale image
|
||||||
|
if bpc == 8 {
|
||||||
|
let gray_data: Vec<u8> = decoded.iter().copied().collect();
|
||||||
|
let img: GrayImage = ImageBuffer::from_raw(width, height, gray_data)
|
||||||
|
.unwrap_or_else(|| ImageBuffer::new(width, height));
|
||||||
|
DynamicImage::ImageLuma8(img)
|
||||||
|
} else if bpc == 1 {
|
||||||
|
// 1-bit grayscale (binary image) - expand to 8-bit
|
||||||
|
let mut gray_data = Vec::with_capacity((width as usize) * (height as usize));
|
||||||
|
for &byte in decoded.iter() {
|
||||||
|
for bit in (0..8).rev() {
|
||||||
|
gray_data.push(if (byte >> bit) & 1 == 1 { 0 } else { 255 });
|
||||||
|
}
|
||||||
|
}
|
||||||
|
let img: GrayImage = ImageBuffer::from_raw(width, height, gray_data)
|
||||||
|
.unwrap_or_else(|| ImageBuffer::new(width, height));
|
||||||
|
DynamicImage::ImageLuma8(img)
|
||||||
|
} else {
|
||||||
|
diagnostics.push(Diagnostic::with_static_no_offset(
|
||||||
|
DiagCode::ImgUnsupportedFormat,
|
||||||
|
"Unsupported bits per component for grayscale image",
|
||||||
|
));
|
||||||
|
return Err(diagnostics);
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
Ok(dynamic_img)
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Convert an image to grayscale.
|
||||||
|
///
|
||||||
|
/// Uses luminance conversion: Y = 0.299*R + 0.587*G + 0.114*B
|
||||||
|
pub fn to_grayscale(img: &DynamicImage) -> GrayImage {
|
||||||
|
img.to_luma8()
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Composite images onto a canvas using their CTMs.
|
||||||
|
///
|
||||||
|
/// # Arguments
|
||||||
|
///
|
||||||
|
/// * `placements` - Image placements with CTMs
|
||||||
|
/// * `page_width` - Page width in PDF points
|
||||||
|
/// * `page_height` - Page height in PDF points
|
||||||
|
/// * `dpi` - Resolution for rendering (default 300)
|
||||||
|
/// * `resolver` - The xref resolver
|
||||||
|
/// * `source` - The PDF source
|
||||||
|
/// * `max_bytes` - Maximum decompressed bytes
|
||||||
|
///
|
||||||
|
/// # Returns
|
||||||
|
///
|
||||||
|
/// The composited grayscale image, or diagnostics if compositing fails.
|
||||||
|
pub fn composite_images(
|
||||||
|
placements: &[ImagePlacement],
|
||||||
|
page_width: f64,
|
||||||
|
page_height: f64,
|
||||||
|
dpi: u32,
|
||||||
|
resolver: &XrefResolver,
|
||||||
|
source: &dyn PdfSource,
|
||||||
|
max_bytes: u64,
|
||||||
|
) -> Result<GrayImage> {
|
||||||
|
composite_images_with_rotation(placements, page_width, page_height, dpi, 0, resolver, source, max_bytes)
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Composite images onto a canvas using their CTMs, with page rotation support.
|
||||||
|
///
|
||||||
|
/// # Arguments
|
||||||
|
///
|
||||||
|
/// * `placements` - Image placements with CTMs
|
||||||
|
/// * `page_width` - Page width in PDF points
|
||||||
|
/// * `page_height` - Page height in PDF points
|
||||||
|
/// * `dpi` - Resolution for rendering (default 300)
|
||||||
|
/// * `rotation` - Page rotation in degrees (0, 90, 180, 270)
|
||||||
|
/// * `resolver` - The xref resolver
|
||||||
|
/// * `source` - The PDF source
|
||||||
|
/// * `max_bytes` - Maximum decompressed bytes
|
||||||
|
///
|
||||||
|
/// # Returns
|
||||||
|
///
|
||||||
|
/// The composited grayscale image, or diagnostics if compositing fails.
|
||||||
|
pub fn composite_images_with_rotation(
|
||||||
|
placements: &[ImagePlacement],
|
||||||
|
page_width: f64,
|
||||||
|
page_height: f64,
|
||||||
|
dpi: u32,
|
||||||
|
rotation: i32,
|
||||||
|
resolver: &XrefResolver,
|
||||||
|
source: &dyn PdfSource,
|
||||||
|
max_bytes: u64,
|
||||||
|
) -> Result<GrayImage> {
|
||||||
|
let mut diagnostics = Vec::new();
|
||||||
|
|
||||||
|
// Normalize rotation to 0-360 range and ensure it's a multiple of 90
|
||||||
|
let rotation = ((rotation % 360) + 360) % 360;
|
||||||
|
let rotation = match rotation {
|
||||||
|
0 | 90 | 180 | 270 => rotation,
|
||||||
|
_ => 0, // Invalid rotation, default to 0
|
||||||
|
};
|
||||||
|
|
||||||
|
// For rotated pages, swap width and height
|
||||||
|
let (effective_width, effective_height) = match rotation {
|
||||||
|
90 | 270 => (page_height, page_width),
|
||||||
|
_ => (page_width, page_height),
|
||||||
|
};
|
||||||
|
|
||||||
|
// Calculate canvas size in pixels
|
||||||
|
let scale = dpi as f64 / 72.0;
|
||||||
|
let canvas_width = (effective_width * scale).ceil() as u32;
|
||||||
|
let canvas_height = (effective_height * scale).ceil() as u32;
|
||||||
|
|
||||||
|
// Create white canvas
|
||||||
|
let mut canvas = GrayImage::new(canvas_width, canvas_height);
|
||||||
|
for pixel in canvas.pixels_mut() {
|
||||||
|
*pixel = Luma([255]); // White background
|
||||||
|
}
|
||||||
|
|
||||||
|
// Composite each image
|
||||||
|
for placement in placements {
|
||||||
|
// Get the XObject /Matrix if present
|
||||||
|
let xobject_matrix = get_xobject_matrix(placement.xobject_ref, resolver);
|
||||||
|
|
||||||
|
// Compose the placement CTM with the XObject /Matrix
|
||||||
|
// The effective CTM is: placement_ctm * xobject_matrix
|
||||||
|
let effective_ctm = placement.ctm.multiply(&xobject_matrix);
|
||||||
|
|
||||||
|
// Decode the image
|
||||||
|
let img = match decode_image_xobject(placement.xobject_ref, resolver, source, max_bytes) {
|
||||||
|
Ok(img) => img,
|
||||||
|
Err(mut diags) => {
|
||||||
|
diagnostics.append(&mut diags);
|
||||||
|
continue; // Skip this image but continue with others
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
// Convert to grayscale
|
||||||
|
let gray_img = to_grayscale(&img);
|
||||||
|
|
||||||
|
// Compute placement using the effective CTM
|
||||||
|
// The CTM transforms from image space to PDF user space
|
||||||
|
// For images, we need to transform the unit square [0,1]x[0,1]
|
||||||
|
|
||||||
|
// Transform the image corners
|
||||||
|
let corners = [
|
||||||
|
(0.0, 0.0), // Bottom-left
|
||||||
|
(1.0, 0.0), // Bottom-right
|
||||||
|
(0.0, 1.0), // Top-left
|
||||||
|
(1.0, 1.0), // Top-right
|
||||||
|
];
|
||||||
|
|
||||||
|
let mut transformed_corners = Vec::new();
|
||||||
|
for &(x, y) in &corners {
|
||||||
|
let (tx, ty) = effective_ctm.transform_point(x, y);
|
||||||
|
// Convert PDF points to pixels
|
||||||
|
let mut px = tx * scale;
|
||||||
|
let mut py = (page_height - ty) * scale; // Flip Y for image coordinates
|
||||||
|
|
||||||
|
// Apply rotation to pixel coordinates
|
||||||
|
match rotation {
|
||||||
|
90 => {
|
||||||
|
// Rotate 90 degrees clockwise
|
||||||
|
let old_px = px;
|
||||||
|
px = py;
|
||||||
|
py = (canvas_height as f64) - old_px;
|
||||||
|
}
|
||||||
|
180 => {
|
||||||
|
// Rotate 180 degrees
|
||||||
|
px = (canvas_width as f64) - px;
|
||||||
|
py = (canvas_height as f64) - py;
|
||||||
|
}
|
||||||
|
270 => {
|
||||||
|
// Rotate 270 degrees clockwise (90 counterclockwise)
|
||||||
|
let old_px = px;
|
||||||
|
px = (canvas_width as f64) - py;
|
||||||
|
py = old_px;
|
||||||
|
}
|
||||||
|
_ => {
|
||||||
|
// No rotation
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
transformed_corners.push((px, py));
|
||||||
|
}
|
||||||
|
|
||||||
|
// Compute bounding box
|
||||||
|
let min_x = transformed_corners.iter().map(|(x, _)| x).fold(f64::INFINITY, |a, &b| a.min(b)).floor() as i32;
|
||||||
|
let max_x = transformed_corners.iter().map(|(x, _)| x).fold(f64::NEG_INFINITY, |a, &b| a.max(b)).ceil() as i32;
|
||||||
|
let min_y = transformed_corners.iter().map(|(_, y)| y).fold(f64::INFINITY, |a, &b| a.min(b)).floor() as i32;
|
||||||
|
let max_y = transformed_corners.iter().map(|(_, y)| y).fold(f64::NEG_INFINITY, |a, &b| a.max(b)).ceil() as i32;
|
||||||
|
|
||||||
|
// Clamp to canvas bounds
|
||||||
|
let min_x = min_x.max(0) as u32;
|
||||||
|
let max_x = max_x.min(canvas_width as i32 - 1) as u32;
|
||||||
|
let min_y = min_y.max(0) as u32;
|
||||||
|
let max_y = max_y.min(canvas_height as i32 - 1) as u32;
|
||||||
|
|
||||||
|
if min_x >= max_x || min_y >= max_y {
|
||||||
|
// Image is outside canvas bounds
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
// For now, use a simple placement without proper perspective transform
|
||||||
|
// This handles the common case of untransformed full-page images
|
||||||
|
|
||||||
|
// Copy image pixels to canvas (simple copy for now)
|
||||||
|
let img_width = gray_img.width();
|
||||||
|
let img_height = gray_img.height();
|
||||||
|
|
||||||
|
// Scale image to fit bounding box
|
||||||
|
let bbox_width = max_x - min_x;
|
||||||
|
let bbox_height = max_y - min_y;
|
||||||
|
|
||||||
|
if bbox_width == 0 || bbox_height == 0 {
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Resize image to fit
|
||||||
|
let resized = if img_width != bbox_width || img_height != bbox_height {
|
||||||
|
image::imageops::resize(&gray_img, bbox_width, bbox_height, image::imageops::FilterType::Lanczos3)
|
||||||
|
} else {
|
||||||
|
gray_img
|
||||||
|
};
|
||||||
|
|
||||||
|
// Copy pixels to canvas
|
||||||
|
for y in 0..bbox_height {
|
||||||
|
for x in 0..bbox_width {
|
||||||
|
let canvas_x = min_x + x;
|
||||||
|
let canvas_y = min_y + y;
|
||||||
|
if canvas_x < canvas_width && canvas_y < canvas_height {
|
||||||
|
let pixel = resized.get_pixel(x, y);
|
||||||
|
canvas.put_pixel(canvas_x, canvas_y, *pixel);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if diagnostics.is_empty() {
|
||||||
|
Ok(canvas)
|
||||||
|
} else {
|
||||||
|
// Return canvas even with diagnostics (partial result)
|
||||||
|
Ok(canvas)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[cfg(test)]
|
||||||
|
mod tests {
|
||||||
|
use super::*;
|
||||||
|
use crate::parser::resources::ResourceDict;
|
||||||
|
use std::sync::Arc;
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_collect_image_placements_empty() {
|
||||||
|
let content = b"";
|
||||||
|
let resources = ResourceDict::new();
|
||||||
|
let result = collect_image_placements(content, &resources);
|
||||||
|
assert!(result.is_ok());
|
||||||
|
assert!(result.unwrap().is_empty());
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_collect_image_placements_simple() {
|
||||||
|
// Simple content stream with one Do operator
|
||||||
|
let content = b"/Im1 Do";
|
||||||
|
let mut resources = ResourceDict::new();
|
||||||
|
resources.xobjects.insert(Arc::from("Im1"), ObjRef::new(1, 0));
|
||||||
|
|
||||||
|
let result = collect_image_placements(content, &resources);
|
||||||
|
assert!(result.is_ok());
|
||||||
|
let placements = result.unwrap();
|
||||||
|
assert_eq!(placements.len(), 1);
|
||||||
|
assert_eq!(placements[0].name.as_ref(), "Im1");
|
||||||
|
// CTM should be identity
|
||||||
|
assert!(placements[0].ctm.is_identity());
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_collect_image_placements_with_ctm() {
|
||||||
|
// Content stream with cm and Do operators
|
||||||
|
let content = b"1 0 0 1 100 200 cm /Im1 Do";
|
||||||
|
let mut resources = ResourceDict::new();
|
||||||
|
resources.xobjects.insert(Arc::from("Im1"), ObjRef::new(1, 0));
|
||||||
|
|
||||||
|
let result = collect_image_placements(content, &resources);
|
||||||
|
assert!(result.is_ok());
|
||||||
|
let placements = result.unwrap();
|
||||||
|
assert_eq!(placements.len(), 1);
|
||||||
|
// CTM should have translation
|
||||||
|
assert_eq!(placements[0].ctm.e, 100.0);
|
||||||
|
assert_eq!(placements[0].ctm.f, 200.0);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_collect_image_placements_with_stack() {
|
||||||
|
// Content stream with q/Q operators
|
||||||
|
let content = b"q 1 0 0 1 100 200 cm /Im1 Do Q /Im2 Do";
|
||||||
|
let mut resources = ResourceDict::new();
|
||||||
|
resources.xobjects.insert(Arc::from("Im1"), ObjRef::new(1, 0));
|
||||||
|
resources.xobjects.insert(Arc::from("Im2"), ObjRef::new(2, 0));
|
||||||
|
|
||||||
|
let result = collect_image_placements(content, &resources);
|
||||||
|
assert!(result.is_ok());
|
||||||
|
let placements = result.unwrap();
|
||||||
|
assert_eq!(placements.len(), 2);
|
||||||
|
// First image should have translation
|
||||||
|
assert_eq!(placements[0].ctm.e, 100.0);
|
||||||
|
assert_eq!(placements[0].ctm.f, 200.0);
|
||||||
|
// Second image should have identity CTM (after Q)
|
||||||
|
assert!(placements[1].ctm.is_identity());
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_to_grayscale() {
|
||||||
|
// Create a simple RGB image
|
||||||
|
let rgb_img: RgbImage = ImageBuffer::from_fn(2, 2, |x, y| {
|
||||||
|
match (x, y) {
|
||||||
|
(0, 0) => Rgb([255, 0, 0]), // Red
|
||||||
|
(1, 0) => Rgb([0, 255, 0]), // Green
|
||||||
|
(0, 1) => Rgb([0, 0, 255]), // Blue
|
||||||
|
(1, 1) => Rgb([255, 255, 255]), // White
|
||||||
|
_ => Rgb([0, 0, 0]), // Should never happen for 2x2 image
|
||||||
|
}
|
||||||
|
});
|
||||||
|
|
||||||
|
let dynamic = DynamicImage::ImageRgb8(rgb_img);
|
||||||
|
let gray = to_grayscale(&dynamic);
|
||||||
|
|
||||||
|
// Check that grayscale conversion worked
|
||||||
|
assert_eq!(gray.width(), 2);
|
||||||
|
assert_eq!(gray.height(), 2);
|
||||||
|
|
||||||
|
// Red pixel should be dark
|
||||||
|
let r_pixel = gray.get_pixel(0, 0);
|
||||||
|
assert!(r_pixel[0] < 100); // Luminance of red is low
|
||||||
|
|
||||||
|
// Green pixel should be medium
|
||||||
|
let g_pixel = gray.get_pixel(1, 0);
|
||||||
|
assert!(g_pixel[0] > 100 && g_pixel[0] < 200);
|
||||||
|
|
||||||
|
// Blue pixel should be dark
|
||||||
|
let b_pixel = gray.get_pixel(0, 1);
|
||||||
|
assert!(b_pixel[0] < 100);
|
||||||
|
|
||||||
|
// White pixel should be bright
|
||||||
|
let w_pixel = gray.get_pixel(1, 1);
|
||||||
|
assert!(w_pixel[0] > 200);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_collect_image_placements_with_bi() {
|
||||||
|
// Content stream with BI operator (inline image)
|
||||||
|
// Should emit a diagnostic but not crash
|
||||||
|
let content = b"BI";
|
||||||
|
let resources = ResourceDict::new();
|
||||||
|
let result = collect_image_placements(content, &resources);
|
||||||
|
|
||||||
|
// Should return Ok (no placements) but the implementation
|
||||||
|
// currently emits a diagnostic inline
|
||||||
|
assert!(result.is_ok());
|
||||||
|
let placements = result.unwrap();
|
||||||
|
assert_eq!(placements.len(), 0);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_graphics_state_stack_limit() {
|
||||||
|
// Test that the graphics state stack depth limit is enforced
|
||||||
|
let content: Vec<u8> = b"q ".repeat(100).into(); // 100 q operators (exceeds MAX_GSTATE_DEPTH)
|
||||||
|
let resources = ResourceDict::new();
|
||||||
|
let result = collect_image_placements(&content, &resources);
|
||||||
|
|
||||||
|
// Should fail due to stack overflow
|
||||||
|
assert!(result.is_err());
|
||||||
|
|
||||||
|
let diags = result.unwrap_err();
|
||||||
|
assert!(diags.iter().any(|d| d.code == DiagCode::GstateStackOverflow));
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_ctm_with_scale() {
|
||||||
|
// Test CTM with scaling
|
||||||
|
let content = b"2 0 0 2 0 0 cm /Im1 Do";
|
||||||
|
let mut resources = ResourceDict::new();
|
||||||
|
resources.xobjects.insert(Arc::from("Im1"), ObjRef::new(1, 0));
|
||||||
|
|
||||||
|
let result = collect_image_placements(content, &resources);
|
||||||
|
assert!(result.is_ok());
|
||||||
|
let placements = result.unwrap();
|
||||||
|
assert_eq!(placements.len(), 1);
|
||||||
|
// CTM should have scale
|
||||||
|
assert_eq!(placements[0].ctm.a, 2.0);
|
||||||
|
assert_eq!(placements[0].ctm.d, 2.0);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_ctm_with_rotation() {
|
||||||
|
// Test CTM with rotation (90 degrees)
|
||||||
|
// [0 1 -1 0 0 0] is a 90-degree rotation
|
||||||
|
let content = b"0 1 -1 0 100 200 cm /Im1 Do";
|
||||||
|
let mut resources = ResourceDict::new();
|
||||||
|
resources.xobjects.insert(Arc::from("Im1"), ObjRef::new(1, 0));
|
||||||
|
|
||||||
|
let result = collect_image_placements(content, &resources);
|
||||||
|
assert!(result.is_ok());
|
||||||
|
let placements = result.unwrap();
|
||||||
|
assert_eq!(placements.len(), 1);
|
||||||
|
// CTM should have rotation
|
||||||
|
assert_eq!(placements[0].ctm.a, 0.0);
|
||||||
|
assert_eq!(placements[0].ctm.b, 1.0);
|
||||||
|
assert_eq!(placements[0].ctm.c, -1.0);
|
||||||
|
assert_eq!(placements[0].ctm.d, 0.0);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_ctm_with_flip() {
|
||||||
|
// Test CTM with Y flip (negative determinant)
|
||||||
|
// [1 0 0 -1 0 height] flips Y
|
||||||
|
let content = b"1 0 0 -1 0 792 cm /Im1 Do";
|
||||||
|
let mut resources = ResourceDict::new();
|
||||||
|
resources.xobjects.insert(Arc::from("Im1"), ObjRef::new(1, 0));
|
||||||
|
|
||||||
|
let result = collect_image_placements(content, &resources);
|
||||||
|
assert!(result.is_ok());
|
||||||
|
let placements = result.unwrap();
|
||||||
|
assert_eq!(placements.len(), 1);
|
||||||
|
// CTM should have Y flip
|
||||||
|
assert_eq!(placements[0].ctm.a, 1.0);
|
||||||
|
assert_eq!(placements[0].ctm.d, -1.0);
|
||||||
|
assert!(placements[0].ctm.has_flip());
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_multiple_images_different_ctms() {
|
||||||
|
// Test multiple images with different CTMs
|
||||||
|
let content = b"q 1 0 0 1 0 0 cm /Im1 Do Q q 2 0 0 2 100 100 cm /Im2 Do Q q 0 1 -1 0 200 200 cm /Im3 Do Q";
|
||||||
|
let mut resources = ResourceDict::new();
|
||||||
|
resources.xobjects.insert(Arc::from("Im1"), ObjRef::new(1, 0));
|
||||||
|
resources.xobjects.insert(Arc::from("Im2"), ObjRef::new(2, 0));
|
||||||
|
resources.xobjects.insert(Arc::from("Im3"), ObjRef::new(3, 0));
|
||||||
|
|
||||||
|
let result = collect_image_placements(content, &resources);
|
||||||
|
assert!(result.is_ok());
|
||||||
|
let placements = result.unwrap();
|
||||||
|
assert_eq!(placements.len(), 3);
|
||||||
|
|
||||||
|
// First image: identity
|
||||||
|
assert!(placements[0].ctm.is_identity());
|
||||||
|
|
||||||
|
// Second image: scale and translate
|
||||||
|
assert_eq!(placements[1].ctm.a, 2.0);
|
||||||
|
assert_eq!(placements[1].ctm.d, 2.0);
|
||||||
|
assert_eq!(placements[1].ctm.e, 100.0);
|
||||||
|
assert_eq!(placements[1].ctm.f, 100.0);
|
||||||
|
|
||||||
|
// Third image: rotate and translate
|
||||||
|
assert_eq!(placements[2].ctm.a, 0.0);
|
||||||
|
assert_eq!(placements[2].ctm.b, 1.0);
|
||||||
|
assert_eq!(placements[2].ctm.e, 200.0);
|
||||||
|
assert_eq!(placements[2].ctm.f, 200.0);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_image_count_limit() {
|
||||||
|
// Test that the image count limit is enforced
|
||||||
|
let mut content = String::new();
|
||||||
|
let mut resources = ResourceDict::new();
|
||||||
|
|
||||||
|
// Create 300 image references (exceeds MAX_IMAGES_PER_PAGE)
|
||||||
|
for i in 0..300 {
|
||||||
|
content.push_str(&format!("/Im{} Do ", i));
|
||||||
|
resources.xobjects.insert(Arc::from(format!("Im{}", i)), ObjRef::new(i as u32, 0));
|
||||||
|
}
|
||||||
|
|
||||||
|
let result = collect_image_placements(content.as_bytes(), &resources);
|
||||||
|
assert!(result.is_err());
|
||||||
|
|
||||||
|
let diags = result.unwrap_err();
|
||||||
|
assert!(diags.iter().any(|d| d.code == DiagCode::StreamBomb));
|
||||||
|
}
|
||||||
|
}
|
||||||
Loading…
Add table
Reference in a new issue