Files
fil/docs/snippets/go/config/advanced_config.md

55 lines
1.1 KiB
Markdown
Raw Permalink Normal View History

2026-06-01 23:40:55 +02:00
```go title="Go"
package main
import (
"fmt"
"log"
"github.com/kreuzberg-dev/kreuzberg/packages/go/v5"
)
// main builds an ExtractionConfig that sets OCR, chunking, language-detection,
// cache and quality-processing options, extracts "document.pdf" with it, and
// prints a short preview of the first chunk plus any detected languages.
// The process exits via log.Fatalf if extraction returns an error.
func main() {
	// These settings are assigned by pointer below, so each value needs an
	// addressable variable.
	maxChars := uint(1000)
	maxOverlap := uint(100)
	useCache := true
	enableQuality := true
	languageDetectionEnabled := true

	config := kreuzberg.ExtractionConfig{
		Ocr: &kreuzberg.OcrConfig{
			Backend:  "tesseract",
			Language: "eng+deu",
		},
		Chunking: &kreuzberg.ChunkingConfig{
			MaxCharacters: &maxChars,
			Overlap:       &maxOverlap,
		},
		LanguageDetection: &kreuzberg.LanguageDetectionConfig{
			Enabled:        &languageDetectionEnabled,
			DetectMultiple: true,
		},
		UseCache:                &useCache,
		EnableQualityProcessing: &enableQuality,
	}

	result, err := kreuzberg.ExtractFileSync("document.pdf", nil, config)
	if err != nil {
		log.Fatalf("extract failed: %v", err)
	}

	// Access chunks
	if len(result.Chunks) > 0 {
		// Upper bound on the preview length, counted in characters (runes).
		const previewRunes = 100

		snippet := result.Chunks[0].Content
		// Truncate on a rune boundary. A plain byte slice such as
		// snippet[:100] can cut a multi-byte UTF-8 character in half and
		// print invalid text. Ranging over a string yields the byte offset
		// at which each rune starts, so the offset of rune number
		// previewRunes is a safe place to cut.
		seen := 0
		for offset := range snippet {
			if seen == previewRunes {
				snippet = snippet[:offset]
				break
			}
			seen++
		}
		fmt.Printf("First chunk: %s...\n", snippet)
	}

	// Access detected languages
	if len(result.DetectedLanguages) > 0 {
		fmt.Printf("Languages: %v\n", result.DetectedLanguages)
	}
}
```