This commit is contained in:
21
docs/snippets/elixir/utils/embedding_with_chunking.md
Normal file
21
docs/snippets/elixir/utils/embedding_with_chunking.md
Normal file
@@ -0,0 +1,21 @@
|
||||
<!-- snippet:syntax-only -->
|
||||
|
||||
```elixir
|
||||
# Options placed under the "embedding" key of the chunking config.
embedding_opts = %{
  "model" => %{"preset" => %{"name" => "balanced"}},
  "normalize" => true,
  "batch_size" => 32,
  "show_download_progress" => false
}

# Chunking options; the embedding options are nested inside this map.
chunking_opts = %{
  "max_characters" => 1024,
  "overlap" => 100,
  "embedding" => embedding_opts
}

# The extraction call below receives the configuration as a JSON string.
config_json = Jason.encode!(%{"chunking" => chunking_opts})

# Strict match: anything other than {:ok, json} raises MatchError.
{:ok, json} = Kreuzberg.extract_file_async("document.pdf", nil, config_json)

result = Jason.decode!(json)

# A missing or nil "chunks" entry is reported as zero chunks.
chunks = result["chunks"] || []
IO.puts("chunks: #{length(chunks)}")
|
||||
```
|
||||
Reference in New Issue
Block a user