This commit is contained in:
@@ -0,0 +1,16 @@
|
||||
{
|
||||
"document": "../../../../test_documents/vendored/unstructured/doc/duplicate-paragraphs.doc",
|
||||
"file_type": "doc",
|
||||
"file_size": 18432,
|
||||
"expected_frameworks": ["kreuzberg", "tika", "unstructured"],
|
||||
"metadata": {
|
||||
"description": "Document from unstructured test suite",
|
||||
"source": "unstructured",
|
||||
"size_category": "small"
|
||||
},
|
||||
"ground_truth": {
|
||||
"text_file": "../../../../test_documents/ground_truth/doc/duplicate-paragraphs.txt",
|
||||
"source": "pandoc",
|
||||
"markdown_file": "../../../../test_documents/ground_truth/doc/duplicate-paragraphs.md"
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,16 @@
|
||||
{
|
||||
"document": "../../../../test_documents/vendored/unstructured/doc/fake-doc-emphasized-text.doc",
|
||||
"file_type": "doc",
|
||||
"file_size": 27648,
|
||||
"expected_frameworks": ["kreuzberg", "tika", "unstructured"],
|
||||
"metadata": {
|
||||
"description": "Document from unstructured test suite",
|
||||
"source": "unstructured",
|
||||
"size_category": "small"
|
||||
},
|
||||
"ground_truth": {
|
||||
"text_file": "../../../../test_documents/ground_truth/doc/fake-doc-emphasized-text.txt",
|
||||
"source": "pandoc",
|
||||
"markdown_file": "../../../../test_documents/ground_truth/doc/fake-doc-emphasized-text.md"
|
||||
}
|
||||
}
|
||||
16
tools/benchmark-harness/fixtures/doc/fake.json
Normal file
16
tools/benchmark-harness/fixtures/doc/fake.json
Normal file
@@ -0,0 +1,16 @@
|
||||
{
|
||||
"document": "../../../../test_documents/vendored/unstructured/doc/fake.doc",
|
||||
"file_type": "doc",
|
||||
"file_size": 18432,
|
||||
"expected_frameworks": ["kreuzberg", "tika", "unstructured"],
|
||||
"metadata": {
|
||||
"description": "Document from unstructured test suite",
|
||||
"source": "unstructured",
|
||||
"size_category": "small"
|
||||
},
|
||||
"ground_truth": {
|
||||
"text_file": "../../../../test_documents/ground_truth/doc/fake.txt",
|
||||
"source": "pandoc",
|
||||
"markdown_file": "../../../../test_documents/ground_truth/doc/fake.md"
|
||||
}
|
||||
}
|
||||
16
tools/benchmark-harness/fixtures/doc/simple.json
Normal file
16
tools/benchmark-harness/fixtures/doc/simple.json
Normal file
@@ -0,0 +1,16 @@
|
||||
{
|
||||
"document": "../../../../test_documents/vendored/unstructured/doc/simple.doc",
|
||||
"file_type": "doc",
|
||||
"file_size": 15872,
|
||||
"expected_frameworks": ["kreuzberg", "tika", "unstructured"],
|
||||
"metadata": {
|
||||
"description": "Document from unstructured test suite",
|
||||
"source": "unstructured",
|
||||
"size_category": "small"
|
||||
},
|
||||
"ground_truth": {
|
||||
"text_file": "../../../../test_documents/ground_truth/doc/simple.txt",
|
||||
"source": "pandoc",
|
||||
"markdown_file": "../../../../test_documents/ground_truth/doc/simple.md"
|
||||
}
|
||||
}
|
||||
16
tools/benchmark-harness/fixtures/doc/unit_test_lists.json
Normal file
16
tools/benchmark-harness/fixtures/doc/unit_test_lists.json
Normal file
@@ -0,0 +1,16 @@
|
||||
{
|
||||
"document": "../../../../test_documents/doc/unit_test_lists.doc",
|
||||
"file_type": "doc",
|
||||
"file_size": 16384,
|
||||
"expected_frameworks": ["kreuzberg"],
|
||||
"metadata": {
|
||||
"description": "doc test: unit_test_lists",
|
||||
"source": "pandoc-generated",
|
||||
"size_category": "small"
|
||||
},
|
||||
"ground_truth": {
|
||||
"text_file": "../../../../test_documents/ground_truth/doc/unit_test_lists.txt",
|
||||
"markdown_file": "../../../../test_documents/ground_truth/doc/unit_test_lists.md",
|
||||
"source": "pandoc"
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user