Files
fil/docs/snippets/dart/ocr/ocr_elements.md

39 lines
1.1 KiB
Markdown
Raw Permalink Normal View History

2026-06-01 23:40:55 +02:00
```dart title="Dart"
import 'package:kreuzberg/kreuzberg.dart';
Future<void> main() async {
final config = ExtractionConfig(
useCache: true,
enableQualityProcessing: true,
forceOcr: false,
disableOcr: false,
ocr: const OcrConfig(
enabled: true,
backend: 'paddleocr',
language: 'en',
autoRotate: false,
elementConfig: OcrElementConfig(
includeElements: true,
minLevel: OcrElementLevel.word,
minConfidence: 0.0,
buildHierarchy: false,
),
),
resultFormat: ResultFormat.unified,
outputFormat: OutputFormat.plain(),
includeDocumentStructure: false,
maxArchiveDepth: 3,
useLayoutForMarkdown: false,
);
final result = await KreuzbergBridge.extractFile('scanned.pdf', null, config);
final elements = result.ocrElements ?? const <OcrElement>[];
for (final element in elements) {
print('Text: ${element.text}');
print('Confidence: ${element.confidence.recognition.toStringAsFixed(2)}');
print('Level: ${element.level}');
print('Page: ${element.pageNumber}');
}
}
```