This commit is contained in:
15
docs/snippets/ruby/getting-started/basic_usage.md
Normal file
15
docs/snippets/ruby/getting-started/basic_usage.md
Normal file
@@ -0,0 +1,15 @@
|
||||
```ruby title="Ruby"
|
||||
require 'kreuzberg'
|
||||
|
||||
# Extract the document; no configuration is passed in this example.
result = Kreuzberg.extract_file_sync('document.pdf')

puts "Content:"
puts result.content

# Safe navigation keeps these lookups from raising when metadata is nil.
puts "\nMetadata:"
puts "Title: #{result.metadata&.dig('title')}"
puts "Author: #{result.metadata&.dig('author')}"

# `&.length || 0` prints 0 instead of raising NoMethodError if a collection
# is nil, matching the nil-tolerant metadata lookups above.
puts "\nTables found: #{result.tables&.length || 0}"
puts "Images found: #{result.images&.length || 0}"
|
||||
```
|
||||
14
docs/snippets/ruby/getting-started/extract_file.md
Normal file
14
docs/snippets/ruby/getting-started/extract_file.md
Normal file
@@ -0,0 +1,14 @@
|
||||
```ruby title="Ruby"
|
||||
require 'kreuzberg'
|
||||
|
||||
# Options for this run: turn on the cache and quality processing.
extraction_options = { use_cache: true, enable_quality_processing: true }
extraction_config = Kreuzberg::ExtractionConfig.new(**extraction_options)

extraction = Kreuzberg.extract_file_sync('contract.pdf', config: extraction_config)

# Report the size of the extracted text and the quality score.
char_count = extraction.content.length
puts "Extracted #{char_count} characters"
puts "Quality score: #{extraction.quality_score}"

# metadata may be nil, so the lookup uses safe navigation.
elapsed = extraction.metadata&.dig('processing_time')
puts "Processing time: #{elapsed}ms"
|
||||
```
|
||||
15
docs/snippets/ruby/getting-started/extract_with_ocr.md
Normal file
15
docs/snippets/ruby/getting-started/extract_with_ocr.md
Normal file
@@ -0,0 +1,15 @@
|
||||
```ruby title="Ruby"
|
||||
require 'kreuzberg'
|
||||
|
||||
# Build the extraction config with its OCR settings inline:
# the 'tesseract' backend with language 'eng'.
config = Kreuzberg::ExtractionConfig.new(
  ocr: Kreuzberg::OcrConfig.new(backend: 'tesseract', language: 'eng')
)

scanned = Kreuzberg.extract_file_sync('scanned.pdf', config: config)

puts "Extracted text from scanned document:"
puts scanned.content
puts "Used OCR backend: tesseract"
|
||||
```
|
||||
7
docs/snippets/ruby/getting-started/hello_world.md
Normal file
7
docs/snippets/ruby/getting-started/hello_world.md
Normal file
@@ -0,0 +1,7 @@
|
||||
```ruby title="Ruby"
|
||||
require 'kreuzberg'
|
||||
|
||||
# Extract the PDF and print a short preview of its content.
extraction = Kreuzberg.extract_file_sync('document.pdf')

puts "Extracted content:"
# [0, 200] takes at most the first 200 characters.
puts extraction.content[0, 200]
|
||||
```
|
||||
9
docs/snippets/ruby/getting-started/install_verify.md
Normal file
9
docs/snippets/ruby/getting-started/install_verify.md
Normal file
@@ -0,0 +1,9 @@
|
||||
```ruby title="Ruby"
|
||||
require 'kreuzberg'
|
||||
|
||||
# Reaching this point means `require 'kreuzberg'` did not raise.
puts "Kreuzberg version: #{Kreuzberg::VERSION}"
puts "FFI bindings loaded successfully"

# Smoke test: run one extraction and report how much text came back.
sample = Kreuzberg.extract_file_sync('sample.pdf')
extracted_chars = sample.content.length
puts "Installation verified! Extracted #{extracted_chars} characters"
|
||||
```
|
||||
15
docs/snippets/ruby/getting-started/read_content.md
Normal file
15
docs/snippets/ruby/getting-started/read_content.md
Normal file
@@ -0,0 +1,15 @@
|
||||
```ruby title="Ruby"
|
||||
require 'kreuzberg'
|
||||
|
||||
result = Kreuzberg.extract_file_sync('document.pdf')

# Pull out the parts of the result this example reports on.
content = result.content
tables = result.tables
images = result.images
metadata = result.metadata

puts "Content: #{content.length} characters"
# `&.length || 0` prints 0 instead of raising NoMethodError if a collection
# is nil, matching the nil-tolerant metadata line below.
puts "Tables: #{tables&.length || 0}"
puts "Images: #{images&.length || 0}"
puts "Metadata keys: #{metadata&.keys&.join(', ')}"
|
||||
```
|
||||
Reference in New Issue
Block a user