// C# example (18 lines, 347 B)
using Kreuzberg;

// Build an extraction configuration that enables OCR through the Tesseract backend.
var config = new ExtractionConfig
{
    Ocr = new OcrConfig
    {
        Backend = "tesseract",

        // '+'-joined language codes (English, German, French). Tesseract uses this
        // form to load several languages at once; presumably the string is handed
        // to the backend unchanged — confirm against the Kreuzberg docs.
        Language = "eng+deu+fra",

        TesseractConfig = new TesseractConfig
        {
            // Page segmentation mode 3. In Tesseract this is "fully automatic page
            // segmentation, but no OSD" (assumes Psm maps directly to --psm).
            Psm = 3
        }
    }
};

// Synchronously extract "document.pdf" with the configuration above and print
// the Content property of the result to standard output.
var result = KreuzbergLib.ExtractFileSync("document.pdf", config);
Console.WriteLine(result.Content);