Files
fil/docs/snippets/go/ocr/image_preprocessing.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

37 lines
742 B
Markdown

```go title="Go"
package main
import (
"log"
"github.com/kreuzberg-dev/kreuzberg/packages/go/v5"
)
// main builds an extraction config whose Tesseract OCR settings carry an
// image-preprocessing section, calls kreuzberg.ExtractFileSync on
// "document.pdf", and logs the length of the returned content. Any
// extraction error is fatal.
func main() {
	// These three options are passed by pointer below, so each needs an
	// addressable local to take the address of.
	dpi := int32(300)
	straighten := true
	method := "otsu"

	// Assemble the innermost section first to keep the nesting shallow.
	preprocessing := &kreuzberg.ImagePreprocessingConfig{
		TargetDpi:          &dpi,
		Denoise:            true,
		Deskew:             &straighten,
		ContrastEnhance:    true,
		BinarizationMethod: &method,
	}
	tesseract := &kreuzberg.TesseractConfig{Preprocessing: preprocessing}
	config := kreuzberg.ExtractionConfig{
		Ocr: &kreuzberg.OcrConfig{TesseractConfig: tesseract},
	}

	result, err := kreuzberg.ExtractFileSync("document.pdf", nil, config)
	if err != nil {
		log.Fatalf("extract failed: %v", err)
	}
	log.Println("content length:", len(result.Content))
}
```