Nomad changes
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s

This commit is contained in:
Henrik Jess Nielsen
2026-06-01 23:40:55 +02:00
parent 72b1a0a6ed
commit b4c07d3693
5723 changed files with 1130655 additions and 0 deletions

View File

@@ -0,0 +1,15 @@
```ruby title="Ruby"
# Extract 'document.pdf' synchronously, then print its content, two metadata
# fields, and how many tables and images the result carries.
require 'kreuzberg'

extraction = Kreuzberg.extract_file_sync('document.pdf')

puts 'Content:'
puts extraction.content

# Safe navigation (&.) keeps these lines from raising when metadata is nil;
# a missing field simply prints as an empty value.
puts "\nMetadata:"
puts "Title: #{extraction.metadata&.dig('title')}"
puts "Author: #{extraction.metadata&.dig('author')}"

puts "\nTables found: #{extraction.tables.length}"
puts "Images found: #{extraction.images.length}"
```

View File

@@ -0,0 +1,14 @@
```ruby title="Ruby"
# Extract 'contract.pdf' with an explicit ExtractionConfig (use_cache and
# enable_quality_processing both switched on) and print a short report.
require 'kreuzberg'

extraction_options = Kreuzberg::ExtractionConfig.new(use_cache: true, enable_quality_processing: true)
document = Kreuzberg.extract_file_sync('contract.pdf', config: extraction_options)

puts "Extracted #{document.content.length} characters"
puts "Quality score: #{document.quality_score}"
# Safe navigation (&.) avoids a NoMethodError when metadata is nil.
puts "Processing time: #{document.metadata&.dig('processing_time')}ms"
```

View File

@@ -0,0 +1,15 @@
```ruby title="Ruby"
# Extract 'scanned.pdf' with an OCR configuration (backend 'tesseract',
# language 'eng') nested inside the extraction configuration.
require 'kreuzberg'

tesseract_english = Kreuzberg::OcrConfig.new(backend: 'tesseract', language: 'eng')
extraction_options = Kreuzberg::ExtractionConfig.new(ocr: tesseract_english)
scan = Kreuzberg.extract_file_sync('scanned.pdf', config: extraction_options)

puts 'Extracted text from scanned document:'
puts scan.content
# The backend name below is a fixed literal; it is not read back from the config.
puts 'Used OCR backend: tesseract'
```

View File

@@ -0,0 +1,7 @@
```ruby title="Ruby"
# Extract 'document.pdf' synchronously and print a short preview of its content.
require 'kreuzberg'

document = Kreuzberg.extract_file_sync('document.pdf')

puts 'Extracted content:'
# The exclusive range 0...200 keeps indices 0 through 199, i.e. at most the
# first 200 characters (assuming content is a String -- confirm against the API).
preview = document.content[0...200]
puts preview
```

View File

@@ -0,0 +1,9 @@
```ruby title="Ruby"
# Installation smoke test: print the gem version constant, then run one
# synchronous extraction of 'sample.pdf' and report how much content came back.
require 'kreuzberg'

puts "Kreuzberg version: #{Kreuzberg::VERSION}"
puts 'FFI bindings loaded successfully'

sample = Kreuzberg.extract_file_sync('sample.pdf')
puts "Installation verified! Extracted #{sample.content.length} characters"
```

View File

@@ -0,0 +1,15 @@
```ruby title="Ruby"
# Extract 'document.pdf' synchronously, read the four fields used below off
# the result, and print a one-line summary for each.
require 'kreuzberg'

extraction = Kreuzberg.extract_file_sync('document.pdf')

# Read every field before any output is produced.
text = extraction.content
table_list = extraction.tables
image_list = extraction.images
meta = extraction.metadata

puts "Content: #{text.length} characters"
puts "Tables: #{table_list.length}"
puts "Images: #{image_list.length}"
# Safe navigation (&.) leaves the key list blank when metadata is nil.
puts "Metadata keys: #{meta&.keys&.join(', ')}"
```