Files
fil/docs/snippets/elixir/ocr/image_preprocessing.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

456 B

# Image preprocessing options; they sit under the Tesseract section of the OCR config.
preprocessing = %{
  "target_dpi" => 300,
  "denoise" => true,
  "deskew" => true,
  "contrast_enhance" => true,
  "binarization_method" => "otsu"
}

# Select the "tesseract" backend and attach the preprocessing options to it.
ocr = %{
  "backend" => "tesseract",
  "tesseract_config" => %{"preprocessing" => preprocessing}
}

# The extraction call below receives the configuration as a JSON string.
config_json = Jason.encode!(%{"ocr" => ocr})

path = "scanned.pdf"
mime_type = "application/pdf"

# Matching on {:ok, result} raises a MatchError if any other value is returned.
{:ok, result} = Kreuzberg.extract_file_sync(path, mime_type, config_json)

# Print the extracted content to standard output.
IO.puts(result.content)