This commit is contained in:
26
docs/snippets/php/metadata/page_tracking_basic.md
Normal file
26
docs/snippets/php/metadata/page_tracking_basic.md
Normal file
@@ -0,0 +1,26 @@
```php title="PHP"
<?php

declare(strict_types=1);

use Kreuzberg\Kreuzberg;
use Kreuzberg\ExtractionConfig;
use Kreuzberg\PageConfig;

// Turn on per-page extraction without inserting page markers into the content.
$config = new ExtractionConfig();
$config->pages = new PageConfig(
    extractPages: true,
    insertPageMarkers: false,
    markerFormat: "\n\n<!-- PAGE {page_num} -->\n\n",
);

$result = Kreuzberg::extract_file_sync("document.pdf", null, $config);

// The page list may be null, so guard before iterating.
if ($result->pages !== null) {
    foreach ($result->pages as $page) {
        echo "Page " . $page->page_number . ":\n";
        // mb_strlen counts characters; strlen would report bytes for multi-byte text.
        echo "  Content: " . mb_strlen($page->content, 'UTF-8') . " chars\n";
        // Tables and images may be null on a page; treat that as an empty list.
        echo "  Tables: " . count($page->tables ?? []) . "\n";
        echo "  Images: " . count($page->images ?? []) . "\n";
    }
}
```
Reference in New Issue
Block a user