This commit is contained in:
23
docs/snippets/rust/config/tesseract_config.md
Normal file
23
docs/snippets/rust/config/tesseract_config.md
Normal file
@@ -0,0 +1,23 @@
|
||||
```rust title="Rust"
|
||||
use kreuzberg::{extract_file_sync, ExtractionConfig, OcrConfig};
|
||||
use kreuzberg::types::TesseractConfig;
|
||||
|
||||
fn main() -> kreuzberg::Result<()> {
|
||||
let config = ExtractionConfig {
|
||||
ocr: Some(OcrConfig {
|
||||
backend: "tesseract".to_string(),
|
||||
language: "eng+deu".to_string(),
|
||||
tesseract_config: Some(TesseractConfig {
|
||||
psm: Some(6),
|
||||
oem: Some(3),
|
||||
..Default::default()
|
||||
}),
|
||||
}),
|
||||
..Default::default()
|
||||
};
|
||||
|
||||
let result = extract_file_sync("scanned.pdf", None::<&str>, &config)?;
|
||||
println!("OCR text: {}", result.content);
|
||||
Ok(())
|
||||
}
|
||||
```
|
||||
Reference in New Issue
Block a user