Files
fil/docs/snippets/rust/advanced/chunk_page_mapping.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

729 B

Use Kreuzberg::{extract_file_sync, ExtractionConfig, ChunkingConfig, PageConfig};

Let config = ExtractionConfig { chunking: Some(ChunkingConfig { max_characters: 500, overlap: 50, ..Default::default() }), pages: Some(PageConfig { extract_pages: true, ..Default::default() }), ..Default::default() };

Let result = extract_file_sync("document.pdf", None, &config)?;

If let Some(chunks) = result.chunks { for chunk in chunks { if let (Some(first), Some(last)) = (chunk.metadata.first_page, chunk.metadata.last_page) { let page_range = if first == last { format!("Page {}", first) } else { format!("Pages {}-{}", first, last) }; println!("Chunk: {}... ({})", chunk.content.chars().take(50).collect::(), page_range); } } }