This commit is contained in:
27
docs/snippets/csharp/ocr/image_preprocessing.md
Normal file
27
docs/snippets/csharp/ocr/image_preprocessing.md
Normal file
@@ -0,0 +1,27 @@
|
||||
```csharp title="C#"
|
||||
using Kreuzberg;
|
||||
|
||||
// Image preprocessing options handed to the Tesseract OCR configuration.
// NOTE(review): "otsu" presumably selects Otsu thresholding — confirm against
// the values the library accepts for BinarizationMethod.
var preprocessing = new ImagePreprocessingConfig
{
    TargetDpi = 300,
    Denoise = true,
    Deskew = true,
    ContrastEnhance = true,
    BinarizationMethod = "otsu",
};

// Nest the preprocessing options: Tesseract config -> OCR config -> extraction config.
var tesseract = new TesseractConfig { Preprocessing = preprocessing };
var ocr = new OcrConfig { TesseractConfig = tesseract };
var config = new ExtractionConfig { Ocr = ocr };

// The second argument is passed as null; its meaning is not visible in this
// snippet (presumably an optional MIME type hint — TODO confirm).
var result = KreuzbergLib.ExtractFileSync("scanned.pdf", null, config);

// Print at most the first 100 characters of the extracted content.
string preview = result.Content;
if (preview.Length > 100)
{
    preview = preview[..100];
}

Console.WriteLine($"Content: {preview}");
|
||||
```
|
||||
Reference in New Issue
Block a user