Files
fil/docs/snippets/dart/getting-started/extract_with_ocr.md

29 lines
711 B
Markdown
Raw Normal View History

2026-06-01 23:40:55 +02:00
```dart title="Dart"
import 'package:kreuzberg/kreuzberg.dart';
/// Extracts `scanned.pdf` with OCR forced on, then prints the extracted
/// content followed by the languages reported on the result.
Future<void> main() async {
  // OCR settings: Tesseract backend, English language, auto-rotation off.
  final ocrSettings = OcrConfig(
    enabled: true,
    backend: 'tesseract',
    language: 'eng',
    autoRotate: false,
  );

  // Extraction settings; `forceOcr: true` is the option this example is
  // about, and the OCR settings built above are attached via `ocr`.
  final extractionConfig = ExtractionConfig(
    useCache: true,
    enableQualityProcessing: true,
    forceOcr: true,
    disableOcr: false,
    resultFormat: ResultFormat.unified,
    outputFormat: OutputFormat.plain(),
    includeDocumentStructure: false,
    maxArchiveDepth: 3,
    useLayoutForMarkdown: false,
    ocr: ocrSettings,
  );

  // The second positional argument is left as null here.
  // NOTE(review): presumably an optional MIME-type hint — confirm against
  // the KreuzbergBridge API.
  final extraction = await KreuzbergBridge.extractFile(
    'scanned.pdf',
    null,
    extractionConfig,
  );

  print(extraction.content);

  final languages = extraction.detectedLanguages;
  print('Detected languages: $languages');
}
```