Files
fil/docs/snippets/php/metadata/page_boundaries.md

30 lines
736 B
Markdown
Raw Permalink Normal View History

2026-06-01 23:40:55 +02:00
```php title="PHP"
<?php

declare(strict_types=1);

use Kreuzberg\ExtractionConfig;
use Kreuzberg\Kreuzberg;
use Kreuzberg\PageConfig;

// Example: extract "document.pdf" with page extraction and inline page
// markers enabled, then print the full content followed by each page.

$config = new ExtractionConfig();
$config->pages = new PageConfig(
    extractPages: true,
    insertPageMarkers: true,
    // PHP does not interpolate "{page_num}" (no "$" follows the brace), so the
    // placeholder is passed to the library verbatim.
    // NOTE(review): presumably Kreuzberg substitutes the page number — confirm.
    markerFormat: "\n\n=== PAGE {page_num} ===\n\n",
);

// NOTE(review): the second argument is passed as null; presumably an optional
// MIME type hint that is left to auto-detection — confirm against the API docs.
$result = Kreuzberg::extract_file_sync("document.pdf", null, $config);

// Content with inline page markers
echo "Full content with markers:\n";
echo $result->content . "\n\n";

// Or access pages separately with boundaries preserved.
// The null check guards the loop: pages is only iterated when it is set.
if ($result->pages !== null) {
    foreach ($result->pages as $page) {
        echo "--- Page " . $page->page_number . " (boundary) ---\n";
        echo $page->content . "\n";
    }
}
```