Nomad changes
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s

This commit is contained in:
Henrik Jess Nielsen
2026-06-01 23:40:55 +02:00
parent 72b1a0a6ed
commit b4c07d3693
5723 changed files with 1130655 additions and 0 deletions

View File

@@ -0,0 +1,25 @@
```go title="Go"
package main
import (
"log"
"github.com/kreuzberg-dev/kreuzberg/packages/go/v5"
)
// Plugin OCR backend registration is not currently exposed by the Go binding.
// Choose one of the built-in backends instead: "tesseract", "paddle-ocr", or a VLM via "vlm".
//
// main extracts scanned.pdf using the "tesseract" backend with language "eng"
// and logs the length of the extracted content.
func main() {
	ocr := kreuzberg.OcrConfig{
		Backend:  "tesseract",
		Language: "eng",
	}
	cfg := kreuzberg.ExtractionConfig{Ocr: &ocr}

	result, err := kreuzberg.ExtractFileSync("scanned.pdf", nil, cfg)
	if err != nil {
		// Nothing useful can be printed without a result, so stop here.
		log.Fatalf("extract failed: %v", err)
	}
	log.Println("content length:", len(result.Content))
}
```

View File

@@ -0,0 +1,32 @@
```go title="Go"
package main
import (
"log"
"github.com/kreuzberg-dev/kreuzberg/packages/go/v5"
)
// main extracts document.pdf with an image-extraction configuration and logs
// the length of the extracted content.
func main() {
	// The image options below are passed by pointer, so each value lives in
	// its own addressable variable.
	var dpi, maxSide int32 = 200, 2048
	withImages, adjustDpi := true, true
	withPlaceholders := true // set to false to extract images without markdown references

	images := kreuzberg.ImageExtractionConfig{
		ExtractImages:      &withImages,
		TargetDpi:          &dpi,
		MaxImageDimension:  &maxSide,
		InjectPlaceholders: &withPlaceholders,
		AutoAdjustDpi:      &adjustDpi,
	}
	cfg := kreuzberg.ExtractionConfig{Images: &images}

	result, err := kreuzberg.ExtractFileSync("document.pdf", nil, cfg)
	if err != nil {
		log.Fatalf("extract failed: %v", err)
	}
	log.Println("content length:", len(result.Content))
}
```

View File

@@ -0,0 +1,36 @@
```go title="Go"
package main
import (
"log"
"github.com/kreuzberg-dev/kreuzberg/packages/go/v5"
)
// main extracts document.pdf with Tesseract image preprocessing configured
// (target DPI 300, denoise, deskew, contrast enhancement, "otsu" binarization)
// and logs the length of the extracted content.
func main() {
	// TargetDpi, Deskew and BinarizationMethod take pointers, so their values
	// need addressable variables; Denoise and ContrastEnhance are set directly.
	var dpi int32 = 300
	straighten := true
	method := "otsu"

	preprocessing := kreuzberg.ImagePreprocessingConfig{
		TargetDpi:          &dpi,
		Denoise:            true,
		Deskew:             &straighten,
		ContrastEnhance:    true,
		BinarizationMethod: &method,
	}
	tesseract := kreuzberg.TesseractConfig{Preprocessing: &preprocessing}
	ocr := kreuzberg.OcrConfig{TesseractConfig: &tesseract}
	config := kreuzberg.ExtractionConfig{Ocr: &ocr}

	result, err := kreuzberg.ExtractFileSync("document.pdf", nil, config)
	if err != nil {
		log.Fatalf("extract failed: %v", err)
	}
	log.Println("content length:", len(result.Content))
}
```

View File

@@ -0,0 +1 @@
EasyOCR is only available in Python.

View File

@@ -0,0 +1,34 @@
```go title="Go"
package main
import (
"fmt"
"log"
"github.com/kreuzberg-dev/kreuzberg/packages/go/v5"
)
// main extracts scanned.pdf using the "paddle-ocr" backend with language "en"
// and prints every OCR element's text, recognition confidence, geometry and,
// when present, rotation angle. Elements are separated by a blank line.
func main() {
	result, err := kreuzberg.ExtractFileSync("scanned.pdf", nil, kreuzberg.ExtractionConfig{
		Ocr: &kreuzberg.OcrConfig{
			Backend:  "paddle-ocr",
			Language: "en",
		},
	})
	if err != nil {
		log.Fatalf("extract failed: %v", err)
	}

	for _, el := range result.OcrElements {
		fmt.Printf("Text: %s\n", el.Text)
		fmt.Printf("Confidence: %.2f\n", el.Confidence.Recognition)
		fmt.Printf("Geometry: %+v\n", el.Geometry)
		// Rotation is optional; only report it when the element carries one.
		if rot := el.Rotation; rot != nil {
			fmt.Printf("Rotation: %.1f°\n", rot.AngleDegrees)
		}
		fmt.Println()
	}
}
```

View File

@@ -0,0 +1,24 @@
```go title="Go"
package main
import (
"log"
"github.com/kreuzberg-dev/kreuzberg/packages/go/v5"
)
// main extracts scanned.pdf using the "tesseract" backend with language "eng"
// and logs the length of the extracted content.
func main() {
	result, err := kreuzberg.ExtractFileSync("scanned.pdf", nil, kreuzberg.ExtractionConfig{
		Ocr: &kreuzberg.OcrConfig{
			Backend:  "tesseract",
			Language: "eng",
		},
	})
	if err != nil {
		log.Fatalf("extract failed: %v", err)
	}

	size := len(result.Content)
	log.Println(size)
}
```

View File

@@ -0,0 +1,24 @@
```go title="Go"
package main
import (
"fmt"
"log"
"github.com/kreuzberg-dev/kreuzberg/packages/go/v5"
)
// main extracts document.pdf using the "tesseract" backend with ForceOcr
// enabled and prints the extracted content to standard output.
func main() {
	cfg := kreuzberg.ExtractionConfig{
		Ocr:      &kreuzberg.OcrConfig{Backend: "tesseract"},
		ForceOcr: true,
	}

	result, err := kreuzberg.ExtractFileSync("document.pdf", nil, cfg)
	if err != nil {
		log.Fatalf("extract failed: %v", err)
	}
	fmt.Println(result.Content)
}
```

View File

@@ -0,0 +1,23 @@
```go title="Go"
package main
import (
"log"
"github.com/kreuzberg-dev/kreuzberg/packages/go/v5"
)
// main extracts multilingual.pdf using the "tesseract" backend and logs the
// extracted content.
func main() {
	// Several language codes are supplied in one string, joined by "+".
	ocr := kreuzberg.OcrConfig{
		Backend:  "tesseract",
		Language: "eng+deu+fra",
	}
	cfg := kreuzberg.ExtractionConfig{Ocr: &ocr}

	result, err := kreuzberg.ExtractFileSync("multilingual.pdf", nil, cfg)
	if err != nil {
		log.Fatalf("extract failed: %v", err)
	}
	log.Println(result.Content)
}
```

View File

@@ -0,0 +1,24 @@
```go title="Go"
package main
import (
"log"
"github.com/kreuzberg-dev/kreuzberg/packages/go/v5"
)
// main extracts scanned.pdf using the "paddle-ocr" backend with language "en"
// and logs the length of the extracted content.
func main() {
	ocr := kreuzberg.OcrConfig{
		Backend:  "paddle-ocr",
		Language: "en",
	}

	result, err := kreuzberg.ExtractFileSync("scanned.pdf", nil, kreuzberg.ExtractionConfig{Ocr: &ocr})
	if err != nil {
		log.Fatalf("extract failed: %v", err)
	}

	size := len(result.Content)
	log.Println(size)
}
```