Files
fil/docs/snippets/elixir/config/element_based_output.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

960 B

# Configure element-based output
config = %Kreuzberg.ExtractionConfig{
  output_format: :element_based
}

# Extract document
{:ok, result} = Kreuzberg.extract_file_sync("document.pdf", config)

# Access elements
Enum.each(result.elements, fn element ->
  IO.puts("Type: #{element.element_type}")

  text = String.slice(element.text, 0, 100)
  IO.puts("Text: #{text}")

  if element.metadata.page_number do
    IO.puts("Page: #{element.metadata.page_number}")
  end

  if element.metadata.coordinates do
    coords = element.metadata.coordinates
    IO.puts("Coords: (#{coords.left}, #{coords.top}) - (#{coords.right}, #{coords.bottom})")
  end

  IO.puts("---")
end)

# Filter by element type
titles = Enum.filter(result.elements, fn e -> e.element_type == :title end)

Enum.each(titles, fn title ->
  level = Map.get(title.metadata.additional, "level", "unknown")
  IO.puts("[#{level}] #{title.text}")
end)