Files
fil/docs/snippets/zig/api/error_handling_extract.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

1.2 KiB

const std = @import("std");
const kreuzberg = @import("kreuzberg");

fn extract_text(bytes: []const u8, mime_type: []const u8) ![]u8 {
    const config_json = "{}";
    return kreuzberg.extract_bytes_sync(bytes, mime_type, config_json);
}

pub fn main() !void {
    var gpa = std.heap.GeneralPurposeAllocator(.{}){};
    defer _ = gpa.deinit();
    const allocator = gpa.allocator();

    const bytes = std.fs.cwd().readFileAlloc(allocator, "document.pdf", 64 * 1024 * 1024) catch &[_]u8{};
    defer if (bytes.len > 0) allocator.free(bytes);

    const stderr = std.io.getStdErr().writer();
    const result_json = extract_text(bytes, "application/pdf") catch |err| {
        switch (err) {
            error.UnsupportedFormat => try stderr.print("Format not supported\n", .{}),
            error.Ocr => try stderr.print("OCR failed\n", .{}),
            error.Validation => try stderr.print("Invalid input or configuration\n", .{}),
            else => try stderr.print("Error: {s}\n", .{@errorName(err)}),
        }
        return;
    };
    defer std.heap.c_allocator.free(result_json);

    const stdout = std.io.getStdOut().writer();
    try stdout.print("Extracted {d} bytes of JSON\n", .{result_json.len});
}