# Benchmark target, declared explicitly because `autobenches = false` in [package].
# `harness = false` turns off the built-in libtest bench harness, so the benchmark
# source must provide its own entry point (presumably through the `criterion`
# dev-dependency listed in this manifest — confirm in benches/extractor.rs).
[[bench]]
name = "extractor"
path = "benches/extractor.rs"
harness = false
required-features = []
# Crates available to the build script only (`build = "build.rs"` in [package]);
# they are not linked into the library itself.
[build-dependencies]
flate2 = { version = "1.0.33" }
fs_extra = { version = "1.3.0" }
reqwest = { version = "0.12.7", features = ["blocking", "json"] }
tar = { version = "0.4.41" }
walkdir = { version = "2.5.0" }
zip = { version = "2.2.0" }
# Runtime dependencies of the `extractous` library.
[dependencies]
bytemuck = { version = "1.17.1" }
jni = { version = "0.21.1", features = ["invocation"] }
libc = { version = "0.2.158" }
strum = { version = "0.26.2" }
strum_macros = { version = "0.26.2" }
thiserror = { version = "1.0.63" }
# Dependencies compiled only for tests, examples and benchmarks.
[dev-dependencies]
criterion = { version = "0.5.1" }
quick-xml = { version = "0.37.1" }
serde = { version = "1.0", features = ["derive"] }
serde_json = { version = "1.0" }
test-case = { version = "3.0" }
textdistance = { version = "1.1.0" }
# Example targets. They are listed explicitly because [package] sets
# `autoexamples = false`, which disables discovery of files under examples/.
[[example]]
name = "extract_to_stream"
path = "examples/extract_to_stream.rs"
[[example]]
name = "extract_to_string"
path = "examples/extract_to_string.rs"
# Library target. Declared explicitly because [package] sets `autolib = false`.
[lib]
name = "extractous"
path = "src/lib.rs"
# Crate metadata for `extractous`.
[package]
authors = ["Yobix AI <dev@yobix.ai>"]
# Target auto-discovery is switched off for every target kind. The bench,
# example, lib and test targets are each declared explicitly in their own
# sections of this manifest; no [[bin]] target is declared here.
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
# Build script that Cargo compiles and runs before building the crate; it uses
# the crates listed under build-dependencies.
build = "build.rs"
categories = ["parsing", "text-processing"]
description = """
Extractous provides a fast and efficient way to extract content from all kinds of file formats including PDF, Word, Excel,
CSV, Email etc. Internally it uses a natively compiled Apache Tika for formats that are not supported natively by the Rust
core.
"""
edition = "2021"
homepage = "https://extractous.yobix.ai"
keywords = ["unstructured", "tika", "text", "pdf", "parser"]
license = "Apache-2.0"
name = "extractous"
readme = "README.md"
repository = "https://github.com/yobix-ai/extractous"
version = "0.3.0"
# Settings applied to `--release` builds.
[profile.release]
# "thin" LTO: cross-crate link-time optimization at a lower build-time cost
# than full ("fat") LTO.
lto = "thin"
# 3 is already Cargo's default for the release profile; kept explicit here.
opt-level = 3
# Passes `-C rpath` to rustc so an rpath is embedded in the built artifacts.
# NOTE(review): presumably needed so native shared libraries prepared by
# build.rs can be located at runtime — confirm against the build script.
rpath = true
# Integration-test targets. They are listed explicitly because [package] sets
# `autotests = false`, which disables discovery of files under tests/.
[[test]]
name = "extract_to_stream_tests"
path = "tests/extract_to_stream_tests.rs"
[[test]]
name = "extract_to_string_tests"
path = "tests/extract_to_string_tests.rs"
[[test]]
name = "extract_to_xml_tests"
path = "tests/extract_to_xml_tests.rs"
# NOTE(review): test_utils is registered as a test target of its own, so Cargo
# builds it as a separate test binary. If the file only holds helpers shared by
# the tests above, confirm that this entry is intentional.
[[test]]
name = "test_utils"
path = "tests/test_utils.rs"