This commit is contained in:
26
docs/snippets/elixir/utils/vector_database_integration.md
Normal file
26
docs/snippets/elixir/utils/vector_database_integration.md
Normal file
@@ -0,0 +1,26 @@
|
||||
<!-- snippet:syntax-only -->
|
||||
|
||||
```elixir
|
||||
# Extraction options, built up as plain maps before being JSON-encoded.
# Note that the "embedding" settings are nested inside "chunking".
embedding_opts = %{
  "model" => %{"preset" => %{"name" => "balanced"}},
  "normalize" => true
}

chunking_opts = %{
  "max_characters" => 512,
  "overlap" => 50,
  "embedding" => embedding_opts
}

config_json = Jason.encode!(%{"chunking" => chunking_opts})

# The match below raises MatchError unless the call returns {:ok, json}.
{:ok, json} = Kreuzberg.extract_file_async("document.pdf", nil, config_json)
result = Jason.decode!(json)

# A missing (or nil) "chunks" entry is treated as an empty list.
chunks = result["chunks"] || []

# Prints one line per chunk: an index-based identifier followed by at most
# the first 50 graphemes of the chunk's "content" (empty string when absent).
print_chunk = fn {chunk, i} ->
  chunk_id = "doc_chunk_#{i}"
  preview = String.slice(chunk["content"] || "", 0, 50)
  IO.puts("Chunk #{chunk_id}: #{preview}")
end

chunks
|> Enum.with_index()
|> Enum.each(print_chunk)
|
||||
```
|
||||
Reference in New Issue
Block a user