Files
fil/docs/snippets/python/advanced/chunk_page_mapping.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

580 B

from kreuzberg import extract_file_sync, ExtractionConfig, ChunkingConfig

# Chunking settings handed to the extractor (max_characters=500, overlap=50).
chunk_settings = ChunkingConfig(max_characters=500, overlap=50)
config = ExtractionConfig(chunking=chunk_settings)

result = extract_file_sync("document.pdf", config=config)

# A falsy `result.chunks` is replaced by an empty tuple so the loop is skipped.
for piece in result.chunks or ():
    meta = piece.metadata
    start_page, end_page = meta.first_page, meta.last_page
    # Chunks whose first page is None are not reported.
    if start_page is not None:
        if start_page == end_page:
            label = f"Page {start_page}"
        else:
            label = f"Pages {start_page}-{end_page}"
        # Show the first 50 characters of the chunk next to its page label.
        print(f"Chunk: {piece.content[:50]}... ({label})")