Files
fil/docs/snippets/csharp/metadata/page_boundaries.md

27 lines
870 B
Markdown
Raw Permalink Normal View History

2026-06-01 23:40:55 +02:00
```csharp title="C#"
using System;
using System.Linq;
using System.Text;
using Kreuzberg;

// Extract a PDF and print a short preview of the first three pages,
// using the per-page byte boundaries reported in the result metadata.
var config = new ExtractionConfig();
var result = KreuzbergLib.ExtractFileSync("document.pdf", null, config);

if (result.Metadata?.Pages?.Boundaries != null)
{
    // Boundaries are byte offsets (Kreuzberg documents them as offsets into the
    // UTF-8 encoded content), while .NET strings are indexed by UTF-16 code units.
    // Slicing the string directly is only correct for pure-ASCII text, so encode
    // once and slice in byte space instead.
    var contentBytes = Encoding.UTF8.GetBytes(result.Content ?? string.Empty);

    foreach (var boundary in result.Metadata.Pages.Boundaries.Take(3))
    {
        // Clamp both ends so an out-of-range or inverted boundary yields an
        // empty page instead of throwing ArgumentOutOfRangeException.
        var pageEnd = Math.Max(0, Math.Min((int)boundary.ByteEnd, contentBytes.Length));
        var pageStart = Math.Max(0, Math.Min((int)boundary.ByteStart, pageEnd));

        var pageText = Encoding.UTF8.GetString(contentBytes, pageStart, pageEnd - pageStart);

        // Show at most the first 100 characters of the page.
        var previewLength = Math.Min(100, pageText.Length);
        var preview = pageText.Substring(0, previewLength);

        Console.WriteLine($"Page {boundary.PageNumber}:");
        Console.WriteLine($" Byte range: {boundary.ByteStart}-{boundary.ByteEnd}");
        Console.WriteLine($" Preview: {preview}...");
    }
}
```