{ "document": "../../../test_documents/docx/test_emf_docx.docx", "file_type": "docx", "file_size": 426097, "expected_frameworks": ["kreuzberg", "docling", "markitdown", "pandoc", "tika", "unstructured"], "metadata": { "description": "Large formatted DOCX - 416KB document with EMF graphics", "category": "docx-complex", "size_class": "medium" }, "ground_truth": { "text_file": "../../../test_documents/ground_truth/docx/docx_large_formatted.txt", "source": "vision" } }