{ "document": "../../../test_documents/xml/simple_note.xml", "file_type": "xml", "file_size": 165, "expected_frameworks": ["kreuzberg", "markitdown", "tika", "unstructured"], "metadata": { "description": "Minimal XML note structure with basic text content", "category": "structured" }, "ground_truth": { "text_file": "../../../test_documents/ground_truth/xml/xml_simple.txt", "source": "vision" } }