Files
fil/docs/snippets/php/getting-started/extract_with_ocr.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

586 B

<?php
declare(strict_types=1);

use Kreuzberg\Kreuzberg;
use Kreuzberg\ExtractionConfig;
use Kreuzberg\OcrConfig;

// Configure the OCR engine: Tesseract backend with the 'eng' language code.
$ocrConfig = new OcrConfig();
$ocrConfig->setBackend('tesseract');
$ocrConfig->setLanguage('eng');

// Build the extraction config with force-OCR enabled and the OCR settings attached.
$config = new ExtractionConfig();
$config->setForceOcr(true);
$config->setOcr($ocrConfig);

// The second argument is left null.
// NOTE(review): presumably the MIME type hint — confirm against the Kreuzberg API.
$result = Kreuzberg::extractFileSync('scanned.pdf', null, $config);

// Terminate the content with a newline so the label printed below does not
// run on from the last line of the extracted text.
echo "Content:\n";
echo $result->getContent(), "\n";

// Fetch the detected languages once and reuse the value; the list is only
// printed when the result is not null.
$detectedLanguages = $result->getDetectedLanguages();
if ($detectedLanguages !== null) {
    echo 'Detected Languages: ' . implode(', ', $detectedLanguages) . "\n";
}