Files
fil/docs/snippets/java/config/element_based_output.md
Henrik Jess Nielsen b4c07d3693
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s
Nomad changes
2026-06-01 23:40:55 +02:00

1.9 KiB

import dev.kreuzberg.Kreuzberg;
import dev.kreuzberg.ExtractionConfig;
import dev.kreuzberg.ExtractionResult;
import dev.kreuzberg.Element;
import dev.kreuzberg.ResultFormat;
import java.nio.file.Path;
import java.util.List;

public class ElementBasedOutput {
    public static void main(String[] args) throws Exception {
        // Configure element-based output
        ExtractionConfig config = ExtractionConfig.builder()
            .withResultFormat(ResultFormat.ElementBased)
            .build();

        // Extract document
        ExtractionResult result = Kreuzberg.extractFileSync(Path.of("document.pdf"), config);

        // Access elements
        List<Element> elements = result.elements();
        if (elements != null) {
            for (Element element : elements) {
                System.out.println("Type: " + element.elementType());

                String text = element.text();
                if (text.length() > 100) {
                    text = text.substring(0, 100);
                }
                System.out.println("Text: " + text);

                if (element.metadata().pageNumber() != null) {
                    System.out.println("Page: " + element.metadata().pageNumber());
                }

                if (element.metadata().coordinates() != null) {
                    System.out.println("Coords: " + element.metadata().coordinates());
                }

                System.out.println("---");
            }

            // Filter by element type
            elements.stream()
                .filter(e -> "Title".equalsIgnoreCase(String.valueOf(e.elementType())))
                .forEach(title -> {
                    String level = title.metadata().additional().getOrDefault("level", "unknown");
                    System.out.printf("[%s] %s%n", level, title.text());
                });
        }
    }
}