# 302 B
# 302 B
from kreuzberg import extract_bytes_sync, ExtractionConfig
# Read the whole PDF into memory as raw bytes. The `with` block closes the
# file handle as soon as the read finishes, before extraction starts.
with open("document.pdf", "rb") as f:
    content = f.read()

# Extract from the in-memory bytes; the MIME type is passed explicitly
# alongside the data, and a default-constructed ExtractionConfig is used.
result = extract_bytes_sync(content, "application/pdf", config=ExtractionConfig())

# Show a short preview (the first 200 elements of the extracted content)
# and how many tables the result carries.
print(result.content[:200])
print(f"Tables: {len(result.tables)}")