This commit is contained in:
24
docs/snippets/python/config/keyword_extraction_config.md
Normal file
24
docs/snippets/python/config/keyword_extraction_config.md
Normal file
@@ -0,0 +1,24 @@
|
||||
```python title="Python"
|
||||
import asyncio
|
||||
from kreuzberg import (
|
||||
ExtractionConfig,
|
||||
KeywordConfig,
|
||||
KeywordAlgorithm,
|
||||
extract_file,
|
||||
)
|
||||
|
||||
async def main() -> None:
|
||||
config: ExtractionConfig = ExtractionConfig(
|
||||
keywords=KeywordConfig(
|
||||
algorithm=KeywordAlgorithm.YAKE,
|
||||
max_keywords=10,
|
||||
min_score=0.3,
|
||||
ngram_range=(1, 3),
|
||||
language="en"
|
||||
)
|
||||
)
|
||||
result = await extract_file("document.pdf", config=config)
|
||||
print(f"Content extracted: {len(result.content)} chars")
|
||||
|
||||
asyncio.run(main())
|
||||
```
|
||||
Reference in New Issue
Block a user