This commit is contained in:
15
tools/benchmark-harness/fixtures/docx_large_formatted.json
Normal file
15
tools/benchmark-harness/fixtures/docx_large_formatted.json
Normal file
@@ -0,0 +1,15 @@
|
||||
{
|
||||
"document": "../../../test_documents/docx/test_emf_docx.docx",
|
||||
"file_type": "docx",
|
||||
"file_size": 426097,
|
||||
"expected_frameworks": ["kreuzberg", "docling", "markitdown", "pandoc", "tika", "unstructured"],
|
||||
"metadata": {
|
||||
"description": "Large formatted DOCX - 416KB document with EMF graphics",
|
||||
"category": "docx-complex",
|
||||
"size_class": "medium"
|
||||
},
|
||||
"ground_truth": {
|
||||
"text_file": "../../../test_documents/ground_truth/docx/docx_large_formatted.txt",
|
||||
"source": "vision"
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user