Files
fil/docs/snippets/python/plugins/plugin_validator.md

35 lines
812 B
Markdown
Raw Permalink Normal View History

2026-06-01 23:40:55 +02:00
```python title="Python"
from kreuzberg import (
ExtractionResult,
ValidationError,
extract_file_sync,
register_validator,
)
class MinLengthValidator:
    """Validator plugin that rejects extraction results with too little content.

    Provides the ``name``, ``version``, ``validate``, ``should_validate``,
    ``initialize`` and ``shutdown`` methods of the object that this snippet
    passes to ``register_validator``.
    """

    # Smallest ``len(result.content)`` that passes validation.
    MIN_LENGTH = 50

    def name(self) -> str:
        """Return the identifier of this validator."""
        return "min_length"

    def version(self) -> str:
        """Return the version string of this validator."""
        return "1.0.0"

    def validate(self, result: ExtractionResult) -> None:
        """Check that ``result.content`` is long enough.

        Args:
            result: Extraction result whose ``content`` length is checked.

        Raises:
            ValidationError: If ``len(result.content)`` is below
                ``MIN_LENGTH``.
        """
        content_length = len(result.content)
        if content_length < self.MIN_LENGTH:
            raise ValidationError(f"Content too short: {content_length}")

    def should_validate(self, result: ExtractionResult) -> bool:
        """Return ``True`` for every result; no result is skipped."""
        return True

    def initialize(self) -> None:
        """Set-up hook; this validator has nothing to prepare."""
        pass

    def shutdown(self) -> None:
        """Tear-down hook; this validator has nothing to release."""
        pass
# Create the validator and pass it to register_validator.
# NOTE(review): presumably registered validators are applied to later
# extractions; confirm against the kreuzberg plugin documentation.
validator = MinLengthValidator()
register_validator(validator)

# Extract "document.pdf" and report the length of the extracted content.
result = extract_file_sync("document.pdf")
print(f"Content length: {len(result.content)}")
```