Files
fil/docs/snippets/kotlin/metadata/page_boundaries.md

25 lines
785 B
Markdown
Raw Normal View History

2026-06-01 23:40:55 +02:00
```kotlin title="Kotlin"
import dev.kreuzberg.*
import java.nio.file.Paths
/**
 * Extracts `document.pdf` and prints the byte range and a short text preview
 * for the first three page boundaries reported in the result metadata.
 *
 * Returns silently when the result carries no page metadata or no boundaries.
 */
fun main() {
    val config = ExtractionConfig.builder().build()
    val result = Kreuzberg.extractFileSync(Paths.get("document.pdf"), null, config)
    val pages = result.metadata().pages() ?: return
    val boundaries = pages.boundaries() ?: return

    // The boundary accessors are named byteStart/byteEnd, i.e. byte offsets, while
    // String.substring indexes UTF-16 chars. Slicing the encoded bytes keeps the two
    // in agreement for non-ASCII text.
    // NOTE(review): assumes the offsets refer to the UTF-8 encoding of content() - confirm.
    val contentBytes = result.content().toByteArray(Charsets.UTF_8)

    for (boundary in boundaries.take(3)) {
        val start = boundary.byteStart().toInt()
        val end = boundary.byteEnd().toInt()
        val pageText = String(contentBytes, start, end - start, Charsets.UTF_8)

        println("Page ${boundary.pageNumber()}:")
        println(" Byte range: $start-$end")
        // take(100) yields at most 100 chars and never fails on shorter pages.
        println(" Preview: ${pageText.take(100)}...")
    }
}
```