Files
fil/docs/snippets/ruby/advanced/chunk_page_mapping.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

498 B

require 'kreuzberg'

# Build an extraction config with chunking turned on; the loop below reads
# per-chunk page metadata from the result.
config = Kreuzberg::ExtractionConfig.new(
  chunking: Kreuzberg::ChunkingConfig.new(max_characters: 500, overlap: 50),
)

result = Kreuzberg.extract_file_sync('document.pdf', config: config)

# Number of leading characters of each chunk shown in the printed preview.
preview_length = 50

# Safe navigation: nothing is printed when `chunks` is nil.
result.chunks&.each do |chunk|
  first = chunk.metadata.first_page
  # Chunks that carry no page information are skipped.
  next if first.nil?

  # NOTE(review): assumes a missing last_page means the chunk sits on a single
  # page; falling back to `first` avoids printing a dangling "Pages 3-". Confirm.
  last = chunk.metadata.last_page || first

  page_range = first == last ? "Page #{first}" : "Pages #{first}-#{last}"

  # `[0, preview_length]` takes exactly preview_length characters; the previous
  # inclusive range `[0..50]` took 51.
  preview = chunk.content[0, preview_length]
  puts "Chunk: #{preview}... (#{page_range})"
end