This commit is contained in:
23
docs/snippets/elixir/advanced/chunk_page_mapping.md
Normal file
23
docs/snippets/elixir/advanced/chunk_page_mapping.md
Normal file
@@ -0,0 +1,23 @@
|
||||
```elixir title="Elixir"
|
||||
config_json = Jason.encode!(%{
|
||||
"chunking" => %{
|
||||
"enabled" => true,
|
||||
"max_characters" => 1024,
|
||||
"overlap" => 128
|
||||
}
|
||||
})
|
||||
|
||||
{:ok, result} = Kreuzberg.extract_file_sync("document.pdf", "application/pdf", config_json)
|
||||
|
||||
# Map chunks to their source pages
|
||||
chunks_with_pages = result.chunks
|
||||
|> Enum.map(fn chunk ->
|
||||
%{
|
||||
"chunk_id" => chunk["id"],
|
||||
"content" => chunk["content"],
|
||||
"page_number" => chunk["page"]
|
||||
}
|
||||
end)
|
||||
|
||||
IO.inspect(chunks_with_pages, label: "Chunks with Page Mapping")
|
||||
```
|
||||
Reference in New Issue
Block a user