import type { ExtractionConfig } from "@kreuzberg/wasm"; import { extractBytes, initWasm } from "@kreuzberg/wasm"; async function extractWithOcr() { await initWasm(); const bytes = new Uint8Array(await fetch("scanned.pdf").then((r) => r.arrayBuffer())); const config: ExtractionConfig = { ocr: { backend: "tesseract-wasm", language: "eng", }, }; const result = await extractBytes(bytes, "application/pdf", config); console.log("Extracted text from scanned document:"); console.log(result.content); if (result.detectedLanguages) { console.log("Detected languages:", result.detectedLanguages); } } extractWithOcr().catch(console.error);