This commit completes Phase 5.2.2 by integrating the pdfium-render path into serve mode with runtime validation and feature propagation. Changes: - Propagate ocr and full-render features from CLI to pdftract-core - Add full_render parameter to serve mode ExtractParams - Implement runtime validation in build_options(): * Returns BadRequest if full_render requested but PDFium unavailable * Falls back to direct compositing if feature not compiled - Update all three serve handlers to handle Result from build_options() Acceptance Criteria: ✅ cargo build --features ocr,serve,full-render succeeds ✅ cargo build --features ocr,serve (no full-render) succeeds ✅ Runtime fallback: full_render=true with feature absent uses direct path Notes: - Binary size CI gate (140 MB) requires separate CI infrastructure - Soft-mask regression tests require separate fixture work Refs: pdftract-4my Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
97 lines
2.4 KiB
TOML
97 lines
2.4 KiB
TOML
[package]
|
|
name = "pdftract-cli"
|
|
version.workspace = true
|
|
edition.workspace = true
|
|
rust-version.workspace = true
|
|
license.workspace = true
|
|
repository.workspace = true
|
|
publish = true
|
|
|
|
[[bin]]
|
|
name = "pdftract"
|
|
path = "src/main.rs"
|
|
test = true
|
|
|
|
[[bin]]
|
|
name = "generate_lzw_fixtures"
|
|
path = "../../tests/fixtures/generate_lzw_fixtures_main.rs"
|
|
|
|
[lib]
|
|
name = "pdftract_cli"
|
|
path = "src/lib.rs"
|
|
|
|
default-run = "pdftract"
|
|
|
|
[dependencies]
|
|
anyhow = { workspace = true }
|
|
atty = "0.2"
|
|
terminal_size = "0.3"
|
|
async-stream = "0.3"
|
|
axum = { version = "0.7", features = ["json", "multipart"] }
|
|
bytes = "1"
|
|
chrono = { version = "0.4", features = ["serde"] }
|
|
clap = { version = "4.5", features = ["derive"] }
|
|
dirs = "5.0"
|
|
hyper = { version = "1.0", features = ["full"] }
|
|
hyper-util = { version = "0.1", features = ["full"] }
|
|
http-body-util = "0.1"
|
|
humantime = "2.1"
|
|
libloading = { version = "0.8", optional = true }
|
|
lzw = { workspace = true }
|
|
multer = "3"
|
|
pdftract-core = { path = "../pdftract-core" }
|
|
regex = "1.10"
|
|
secrecy = { workspace = true }
|
|
semver = "1.0"
|
|
serde = { workspace = true, features = ["derive"] }
|
|
serde_json = "1.0"
|
|
serde_yaml = { version = "0.9", optional = true }
|
|
sha2 = "0.10"
|
|
termcolor = "1.4"
|
|
schemars = { version = "0.8", features = ["derive"] }
|
|
subtle = "2.6"
|
|
tempfile = "3"
|
|
tera = "1"
|
|
tokio = { version = "1", features = ["full"] }
|
|
tokio-stream = "0.1"
|
|
tower = { version = "0.5", features = ["full"] }
|
|
tower-http = { version = "0.5", features = ["cors", "trace", "limit", "compression-full"] }
|
|
tracing = { workspace = true }
|
|
ureq = { version = "2.9", optional = true }
|
|
uuid = { version = "1.0", features = ["v4", "serde"] }
|
|
walkdir = "2"
|
|
|
|
[target.'cfg(unix)'.dependencies]
|
|
libc = "0.2"
|
|
|
|
[features]
|
|
default = []
|
|
# OCR support via Tesseract
|
|
ocr = ["pdftract-core/ocr"]
|
|
# Full rendering via PDFium (JBIG2, JPEG2000, CCITT decoding)
|
|
full-render = ["dep:libloading", "pdftract-core/full-render"]
|
|
# Remote HTTP source support
|
|
remote = ["dep:ureq"]
|
|
# Document profiles
|
|
profiles = ["dep:serde_yaml"]
|
|
# HTTP serve mode
|
|
serve = []
|
|
# MCP server mode
|
|
mcp = []
|
|
# Inspector web viewer
|
|
inspect = []
|
|
# Folder grep mode
|
|
grep = []
|
|
# Content-addressed cache
|
|
cache = []
|
|
# Visual citation receipts
|
|
receipts = []
|
|
# Markdown output
|
|
markdown = []
|
|
|
|
[dev-dependencies]
|
|
ureq = { version = "2.9", features = ["socks-proxy"] }
|
|
serde_yaml = "0.9"
|
|
jsonschema = "0.18"
|
|
reqwest = { version = "0.12", features = ["blocking", "json", "rustls-tls"], default-features = false }
|
|
schemars = { version = "0.8", features = ["derive"] }
|