Files
fil/docs/snippets/elixir/advanced/9_vector_database_integration.exs
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

34 lines
918 B
Elixir

# Vector Database Integration
#
# Extracts a document with chunking turned on, then reshapes every returned
# chunk into a plain map (content + metadata) that can be handed to a vector
# database client.

alias Kreuzberg.ExtractionConfig

# Chunking options forwarded to the extractor via the extraction config.
chunking_opts = %{
  "enabled" => true,
  "max_characters" => 512,
  "overlap" => 50
}

config = %ExtractionConfig{chunking: chunking_opts}

# Run the extraction. The pattern match raises unless an {:ok, result} tuple
# comes back. NOTE(review): the `nil` second argument is presumably the MIME
# type (auto-detect) — confirm against the Kreuzberg docs.
{:ok, result} = Kreuzberg.extract_file("document.pdf", nil, config)

# Build one map per chunk; a nil `chunks` field is treated as "no chunks".
documents =
  for entry <- result.chunks || [] do
    text = entry["content"]

    %{
      content: text,
      metadata: %{
        page: entry["page"],
        char_count: String.length(text)
      }
    }
  end

IO.puts("Prepared #{length(documents)} documents for vector DB")

# `documents` can now be sent to your vector database,
# e.g. documents |> MyVectorDB.index_documents()