Files
fil/docs/snippets/r/plugins/pdf_only_processor.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

596 B

library(kreuzberg)

# Example post-processor that is gated on the document's MIME type.
#
# Args:
#   result: the extraction result handed to the processor; only its
#     `mime_type` element is inspected here.
#
# Returns:
#   `result`, unchanged. This example performs no transformation; it only
#   shows where PDF-specific work would be placed.
pdf_only_processor <- function(result) {
  # Gate the processor so it only runs for PDF documents.
  # identical() always yields a single TRUE/FALSE, so a NULL, NA, empty, or
  # multi-valued mime_type is treated as "not a PDF" instead of raising an
  # error inside `if`. `[[` is used because `$` partially matches list names.
  is_pdf <- identical(result[["mime_type"]], "application/pdf")
  if (!is_pdf) {
    return(result)
  }

  # PDF-specific processing would go here; the example leaves the result as is.
  result
}

# Make the processor available under the name "pdf_only".
register_post_processor("pdf_only", pdf_only_processor)

# Switch post-processing on, run the extraction, and parse the JSON string it
# returns into nested lists (simplifyVector = FALSE stops jsonlite from
# collapsing JSON arrays into vectors or data frames).
config <- list(
  postprocessor = list(enabled = TRUE)
)
json <- extract_file_sync(
  "document.pdf",
  "application/pdf",
  config
)
result <- jsonlite::fromJSON(
  json,
  simplifyVector = FALSE
)

# Report how many characters `result$content` holds.
cat(
  sprintf(
    "Processed PDF: %d characters\n",
    nchar(result$content)
  )
)