14 lines
319 B
C#
14 lines
319 B
C#
|
|
using Kreuzberg;

// Names of the post-processors to switch on, kept in a local so the
// configuration initializer below stays short.
var enabledProcessors = new List<string>
{
    "normalize_whitespace",
    "remove_diacritics"
};

// Extraction settings: UseCache is turned on and the post-processor section
// is enabled with the processor names listed above.
var config = new ExtractionConfig
{
    UseCache = true,
    Postprocessor = new PostProcessorConfig
    {
        Enabled = true,
        EnabledProcessors = enabledProcessors
    }
};

// Extract "document.pdf" using the configuration built above.
// NOTE(review): the "Sync" suffix suggests a blocking call — confirm against the Kreuzberg API.
var result = KreuzbergLib.ExtractFileSync("document.pdf", config);