{ "document": "../../../../test_documents/vendored/unstructured/doc/fake-doc-emphasized-text.doc", "file_type": "doc", "file_size": 27648, "expected_frameworks": ["kreuzberg", "tika", "unstructured"], "metadata": { "description": "Document from unstructured test suite", "source": "unstructured", "size_category": "small" }, "ground_truth": { "text_file": "../../../../test_documents/ground_truth/doc/fake-doc-emphasized-text.txt", "source": "pandoc", "markdown_file": "../../../../test_documents/ground_truth/doc/fake-doc-emphasized-text.md" } }