Files
fil/docs/snippets/zig/config/config_programmatic.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

1.5 KiB

const std = @import("std");
const kreuzberg = @import("kreuzberg");

pub fn main() !void {
    var gpa = std.heap.GeneralPurposeAllocator(.{}){};
    defer _ = gpa.deinit();
    const allocator = gpa.allocator();

    // Build the config JSON programmatically with std.json.
    var arena = std.heap.ArenaAllocator.init(allocator);
    defer arena.deinit();
    const a = arena.allocator();

    var root = std.json.ObjectMap.init(a);
    try root.put("use_cache", std.json.Value{ .bool = true });
    try root.put("enable_quality_processing", std.json.Value{ .bool = true });

    var ocr = std.json.ObjectMap.init(a);
    try ocr.put("backend", std.json.Value{ .string = "tesseract" });
    try ocr.put("language", std.json.Value{ .string = "eng+deu" });
    try root.put("ocr", std.json.Value{ .object = ocr });

    var chunking = std.json.ObjectMap.init(a);
    try chunking.put("max_characters", std.json.Value{ .integer = 1000 });
    try chunking.put("overlap", std.json.Value{ .integer = 200 });
    try root.put("chunking", std.json.Value{ .object = chunking });

    const config_value = std.json.Value{ .object = root };
    var buffer = std.ArrayList(u8).init(a);
    try std.json.stringify(config_value, .{}, buffer.writer());

    const result_json = try kreuzberg.extract_file_sync("document.pdf", null, buffer.items);
    defer std.heap.c_allocator.free(result_json);

    const stdout = std.io.getStdOut().writer();
    try stdout.print("{s}\n", .{result_json});
}