600 B
600 B
# Embedding settings; these are nested under the "chunking" section below.
embedding_opts = %{
  "model" => %{"preset" => %{"name" => "balanced"}},
  "normalize" => true
}

# Chunking settings, carrying the embedding settings as a sub-map.
chunking_opts = %{
  "max_characters" => 512,
  "overlap" => 50,
  "embedding" => embedding_opts
}

# The configuration is handed to Kreuzberg as a JSON-encoded string.
config_json = Jason.encode!(%{"chunking" => chunking_opts})

# Crashes with a MatchError on anything other than {:ok, json}.
# NOTE(review): assumes extract_file_async/3 returns {:ok, json_string}
# directly rather than a Task — confirm against the Kreuzberg API.
{:ok, json} = Kreuzberg.extract_file_async("document.pdf", nil, config_json)
result = Jason.decode!(json)

# A missing (or nil) "chunks" key is treated as an empty list.
chunks = result["chunks"] || []

# Print one line per chunk: a positional id and the first 50 graphemes
# of its content (an absent "content" is shown as an empty preview).
Enum.each(Enum.with_index(chunks), fn {chunk, i} ->
  content = chunk["content"] || ""
  IO.puts("Chunk doc_chunk_#{i}: #{String.slice(content, 0, 50)}")
end)