Files
fil/docs/snippets/csharp/ocr/image_preprocessing.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

664 B

using Kreuzberg;

// Image preprocessing options for the Tesseract OCR step: a target DPI of 300,
// the denoise / deskew / contrast-enhancement switches turned on, and "otsu"
// selected as the binarization method.
var preprocessing = new ImagePreprocessingConfig
{
    TargetDpi = 300,
    Denoise = true,
    Deskew = true,
    ContrastEnhance = true,
    BinarizationMethod = "otsu"
};

// Nest the preprocessing options: Tesseract config -> OCR config -> extraction config.
var tesseract = new TesseractConfig { Preprocessing = preprocessing };
var ocr = new OcrConfig { TesseractConfig = tesseract };
var extractionConfig = new ExtractionConfig { Ocr = ocr };

// Synchronous extraction of the scanned PDF using the configuration above.
// NOTE(review): the second argument is passed as null; presumably an optional
// MIME type hint -- confirm against the Kreuzberg API.
var extraction = KreuzbergLib.ExtractFileSync("scanned.pdf", null, extractionConfig);

// Print at most the first 100 characters of the extracted content.
const int maxPreviewChars = 100;
string text = extraction.Content;
string preview = text;
if (text.Length > maxPreviewChars)
{
    preview = text[..maxPreviewChars];
}

Console.WriteLine($"Content: {preview}");