Files
fil/docs/snippets/dart/ocr/ocr_elements.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

1.1 KiB

import 'package:kreuzberg/kreuzberg.dart';

Future<void> main() async {
  final config = ExtractionConfig(
    useCache: true,
    enableQualityProcessing: true,
    forceOcr: false,
    disableOcr: false,
    ocr: const OcrConfig(
      enabled: true,
      backend: 'paddleocr',
      language: 'en',
      autoRotate: false,
      elementConfig: OcrElementConfig(
        includeElements: true,
        minLevel: OcrElementLevel.word,
        minConfidence: 0.0,
        buildHierarchy: false,
      ),
    ),
    resultFormat: ResultFormat.unified,
    outputFormat: OutputFormat.plain(),
    includeDocumentStructure: false,
    maxArchiveDepth: 3,
    useLayoutForMarkdown: false,
  );

  final result = await KreuzbergBridge.extractFile('scanned.pdf', null, config);
  final elements = result.ocrElements ?? const <OcrElement>[];
  for (final element in elements) {
    print('Text: ${element.text}');
    print('Confidence: ${element.confidence.recognition.toStringAsFixed(2)}');
    print('Level: ${element.level}');
    print('Page: ${element.pageNumber}');
  }
}