Files
fil/docs/snippets/rust/config/tesseract_config.md

24 lines
673 B
Markdown
Raw Permalink Normal View History

2026-06-01 23:40:55 +02:00
```rust title="Rust"
use kreuzberg::{extract_file_sync, ExtractionConfig, OcrConfig};
use kreuzberg::types::TesseractConfig;
fn main() -> kreuzberg::Result<()> {
let config = ExtractionConfig {
ocr: Some(OcrConfig {
backend: "tesseract".to_string(),
language: "eng+deu".to_string(),
tesseract_config: Some(TesseractConfig {
psm: Some(6),
oem: Some(3),
..Default::default()
}),
}),
..Default::default()
};
let result = extract_file_sync("scanned.pdf", None::<&str>, &config)?;
println!("OCR text: {}", result.content);
Ok(())
}
```