30 lines
696 B
Markdown
30 lines
696 B
Markdown
```csharp title="C#"
using Kreuzberg;

// OCR settings: select the "paddle-ocr" backend and the "en" language.
var ocrSettings = new OcrConfig
{
    Backend = "paddle-ocr",
    Language = "en"
};

var extractionConfig = new ExtractionConfig
{
    Ocr = ocrSettings
};

// Extract "scanned.pdf" using the OCR configuration built above.
var extraction = KreuzbergLib.ExtractFileSync("scanned.pdf", extractionConfig);

// OcrElements may be null; only iterate when elements are present.
if (extraction.OcrElements is { } ocrElements)
{
    foreach (var ocrElement in ocrElements)
    {
        Console.WriteLine($"Text: {ocrElement.Text}");
        // Recognition confidence is printed with two decimal places.
        Console.WriteLine($"Confidence: {ocrElement.Confidence.Recognition:F2}");
        Console.WriteLine($"Geometry: {ocrElement.Geometry}");

        // Rotation is optional; print the angle only when it is set.
        if (ocrElement.Rotation is { } rotation)
        {
            Console.WriteLine($"Rotation: {rotation.Angle}°");
        }

        // Blank line separates one element's output from the next.
        Console.WriteLine();
    }
}
```