Files
fil/docs/snippets/zig/plugins/pdf_only_processor.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

1.8 KiB

const std = @import("std");
const kreuzberg = @import("kreuzberg");

const PdfOnlyProcessor = struct {
    pub fn process(self: *PdfOnlyProcessor, result: [*c]const u8, config: [*c]const u8) !void {
        _ = self;
        _ = result;
        _ = config;
        // PDF-specific transforms go here. Parse the JSON result, mutate
        // metadata/content, and forward through the pipeline.
    }

    pub fn processing_stage(self: *PdfOnlyProcessor) [*c]const u8 {
        _ = self;
        return "Middle";
    }

    pub fn should_process(self: *PdfOnlyProcessor, result: [*c]const u8, config: [*c]const u8) i32 {
        _ = self;
        _ = config;
        const slice = std.mem.sliceTo(result, 0);
        return if (std.mem.indexOf(u8, slice, "\"mime_type\":\"application/pdf\"") != null) 1 else 0;
    }

    pub fn estimated_duration_ms(self: *PdfOnlyProcessor, result: [*c]const u8) u64 {
        _ = self;
        _ = result;
        return 5;
    }

    pub fn priority(self: *PdfOnlyProcessor) i32 {
        _ = self;
        return 70;
    }
};

pub fn main() !void {
    var instance = PdfOnlyProcessor{};
    var vtable = kreuzberg.make_post_processor_vtable(PdfOnlyProcessor, &instance);

    vtable.name_fn = struct {
        fn thunk(user_data: ?*anyopaque, out_name: ?*?[*c]u8) callconv(.C) void {
            _ = user_data;
            if (out_name) |ptr| ptr.* = @constCast("pdf-only-processor");
        }
    }.thunk;
    vtable.version_fn = struct {
        fn thunk(user_data: ?*anyopaque, out_version: ?*?[*c]u8) callconv(.C) void {
            _ = user_data;
            if (out_version) |ptr| ptr.* = @constCast("1.0.0");
        }
    }.thunk;

    var out_error: ?[*c]u8 = null;
    _ = kreuzberg.register_post_processor("pdf-only-processor", vtable, &instance, &out_error);
}