586 B
586 B
<?php
declare(strict_types=1);
use Kreuzberg\Kreuzberg;
use Kreuzberg\ExtractionConfig;
use Kreuzberg\OcrConfig;
$ocrConfig = new OcrConfig();
$ocrConfig->setBackend('tesseract');
$ocrConfig->setLanguage('eng');
$config = new ExtractionConfig();
$config->setForceOcr(true);
$config->setOcr($ocrConfig);
$result = Kreuzberg::extractFileSync('scanned.pdf', null, $config);
echo "Content:\n";
echo $result->getContent();
if ($result->getDetectedLanguages() !== null) {
echo "Detected Languages: " . implode(', ', $result->getDetectedLanguages()) . "\n";
}