This commit is contained in:
44
docs/snippets/csharp/api/combining_all_features.md
Normal file
44
docs/snippets/csharp/api/combining_all_features.md
Normal file
@@ -0,0 +1,44 @@
|
||||
```csharp title="C#"
|
||||
using Kreuzberg;
|
||||
|
||||
var config = new ExtractionConfig
|
||||
{
|
||||
OutputFormat = OutputFormat.Markdown,
|
||||
UseCache = true,
|
||||
Ocr = new OcrConfig
|
||||
{
|
||||
Enabled = true,
|
||||
Backend = OcrBackendType.Tesseract,
|
||||
Languages = ["eng"]
|
||||
},
|
||||
ImageExtraction = new ImageExtractionConfig
|
||||
{
|
||||
Enabled = true,
|
||||
MinImageHeight = 100,
|
||||
MinImageWidth = 100
|
||||
},
|
||||
Chunking = new ChunkingConfig
|
||||
{
|
||||
Enabled = true,
|
||||
ChunkerType = ChunkerType.Text,
|
||||
MaxCharacters = 2000,
|
||||
Overlap = 100
|
||||
},
|
||||
LanguageDetection = new LanguageDetectionConfig
|
||||
{
|
||||
Enabled = true
|
||||
}
|
||||
};
|
||||
|
||||
try
|
||||
{
|
||||
var result = await KreuzbergLib.ExtractFile("document.pdf", null, config);
|
||||
Console.WriteLine($"Content: {result.Content}");
|
||||
Console.WriteLine($"Language: {result.Metadata?.LanguageDetection}");
|
||||
Console.WriteLine($"Format: {result.OutputFormat}");
|
||||
}
|
||||
catch (KreuzbergException ex)
|
||||
{
|
||||
Console.WriteLine($"Extraction error: {ex.Message}");
|
||||
}
|
||||
```
|
||||
Reference in New Issue
Block a user