Nomad changes
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s

This commit is contained in:
Henrik Jess Nielsen
2026-06-01 23:40:55 +02:00
parent 72b1a0a6ed
commit b4c07d3693
5723 changed files with 1130655 additions and 0 deletions

View File

@@ -0,0 +1,65 @@
require 'kreuzberg'
# Example 1: Basic YAKE configuration
# Uses YAKE algorithm with default parameters and English stopword filtering
def basic_yake
config = Kreuzberg::ExtractionConfig.new(
keywords: Kreuzberg::KeywordConfig.new(
algorithm: :yake,
max_keywords: 10,
min_score: 0.0,
ngram_range: [1, 3],
language: 'en',
yake_params: nil,
rake_params: nil
)
)
result = Kreuzberg.extract_file('document.pdf', config: config)
puts "Keywords: #{result.keywords}"
end
# Example 2: Advanced YAKE with custom parameters
# Fine-tunes YAKE with custom window size for co-occurrence analysis
def advanced_yake
config = Kreuzberg::ExtractionConfig.new(
keywords: Kreuzberg::KeywordConfig.new(
algorithm: :yake,
max_keywords: 15,
min_score: 0.1,
ngram_range: [1, 2],
language: 'en',
yake_params: Kreuzberg::YakeParams.new(
window_size: 1
),
rake_params: nil
)
)
result = Kreuzberg.extract_file('document.pdf', config: config)
puts "Keywords: #{result.keywords}"
end
# Example 3: RAKE configuration
# Uses RAKE algorithm for rapid keyword extraction with phrase constraints
def rake_config
config = Kreuzberg::ExtractionConfig.new(
keywords: Kreuzberg::KeywordConfig.new(
algorithm: :rake,
max_keywords: 10,
min_score: 5.0,
ngram_range: [1, 3],
language: 'en',
yake_params: nil,
rake_params: Kreuzberg::RakeParams.new(
min_word_length: 1,
max_words_per_phrase: 3
)
)
)
result = Kreuzberg.extract_file('document.pdf', config: config)
puts "Keywords: #{result.keywords}"
end
basic_yake if __FILE__ == $0