Files
fil/docs/snippets/php/metadata/page_tracking_basic.md

27 lines
714 B
Markdown
Raw Normal View History

2026-06-01 23:40:55 +02:00
```php title="PHP"
<?php declare(strict_types=1);
use Kreuzberg\Kreuzberg;
use Kreuzberg\ExtractionConfig;
use Kreuzberg\PageConfig;
// Build an extraction configuration that asks for per-page results.
$config = new ExtractionConfig();
$config->pages = new PageConfig(
    extractPages: true,
    // Markers are switched off here even though a marker format is supplied.
    // NOTE(review): presumably markerFormat only takes effect when
    // insertPageMarkers is true — confirm against the PageConfig docs.
    insertPageMarkers: false,
    markerFormat: "\n\n<!-- PAGE {page_num} -->\n\n",
);

// The second argument is left as null.
// NOTE(review): presumably this is an optional MIME type hint — confirm.
$result = Kreuzberg::extract_file_sync("document.pdf", null, $config);

// Only iterate when per-page data is present on the result.
if ($result->pages !== null) {
    foreach ($result->pages as $page) {
        // strlen() counts bytes, which over-reports multi-byte text; the label
        // says "chars", so count characters instead.
        // Assumes the extracted content is UTF-8 encoded — TODO confirm.
        $charCount = mb_strlen($page->content, 'UTF-8');

        // Tables and images fall back to an empty list when they are null.
        $tableCount = count($page->tables ?? []);
        $imageCount = count($page->images ?? []);

        echo "Page " . $page->page_number . ":\n";
        echo " Content: " . $charCount . " chars\n";
        echo " Tables: " . $tableCount . "\n";
        echo " Images: " . $imageCount . "\n";
    }
}
?>
```