Nomad changes
All checks were successful
Deploy fil (kreuzberg) / deploy (push) Successful in 49s

This commit is contained in:
Henrik Jess Nielsen
2026-06-01 23:40:55 +02:00
parent 72b1a0a6ed
commit b4c07d3693
5723 changed files with 1130655 additions and 0 deletions

View File

@@ -0,0 +1,16 @@
{
"document": "../../../../test_documents/vendored/docling/csv/csv-comma-in-cell.csv",
"file_type": "csv",
"file_size": 46,
"expected_frameworks": ["kreuzberg", "docling", "markitdown", "pandoc", "tika", "unstructured"],
"metadata": {
"description": "Document from docling test suite",
"source": "docling",
"size_category": "small"
},
"ground_truth": {
"text_file": "../../../../test_documents/ground_truth/csv/csv-comma-in-cell.txt",
"source": "pandoc",
"markdown_file": "../../../../test_documents/ground_truth/csv/csv-comma-in-cell.md"
}
}

View File

@@ -0,0 +1,16 @@
{
"document": "../../../../test_documents/vendored/docling/csv/csv-comma.csv",
"file_type": "csv",
"file_size": 1005,
"expected_frameworks": ["kreuzberg", "docling", "markitdown", "pandoc", "tika", "unstructured"],
"metadata": {
"description": "Document from docling test suite",
"source": "docling",
"size_category": "small"
},
"ground_truth": {
"text_file": "../../../../test_documents/ground_truth/csv/csv-comma.txt",
"source": "pandoc",
"markdown_file": "../../../../test_documents/ground_truth/csv/csv-comma.md"
}
}

View File

@@ -0,0 +1,16 @@
{
"document": "../../../../test_documents/vendored/docling/csv/csv-inconsistent-header.csv",
"file_type": "csv",
"file_size": 42,
"expected_frameworks": ["kreuzberg", "docling", "markitdown", "pandoc", "tika", "unstructured"],
"metadata": {
"description": "Document from docling test suite",
"source": "docling",
"size_category": "small"
},
"ground_truth": {
"text_file": "../../../../test_documents/ground_truth/csv/csv-inconsistent-header.txt",
"source": "pandoc",
"markdown_file": "../../../../test_documents/ground_truth/csv/csv-inconsistent-header.md"
}
}

View File

@@ -0,0 +1,16 @@
{
"document": "../../../../test_documents/vendored/docling/csv/csv-pipe.csv",
"file_type": "csv",
"file_size": 997,
"expected_frameworks": ["kreuzberg", "docling", "markitdown", "pandoc", "tika", "unstructured"],
"metadata": {
"description": "Document from docling test suite",
"source": "docling",
"size_category": "small"
},
"ground_truth": {
"text_file": "../../../../test_documents/ground_truth/csv/csv-pipe.txt",
"source": "pandoc",
"markdown_file": "../../../../test_documents/ground_truth/csv/csv-pipe.md"
}
}

View File

@@ -0,0 +1,16 @@
{
"document": "../../../../test_documents/vendored/docling/csv/csv-semicolon.csv",
"file_type": "csv",
"file_size": 997,
"expected_frameworks": ["kreuzberg", "docling", "markitdown", "pandoc", "tika", "unstructured"],
"metadata": {
"description": "Document from docling test suite",
"source": "docling",
"size_category": "small"
},
"ground_truth": {
"text_file": "../../../../test_documents/ground_truth/csv/csv-semicolon.txt",
"source": "pandoc",
"markdown_file": "../../../../test_documents/ground_truth/csv/csv-semicolon.md"
}
}

View File

@@ -0,0 +1,16 @@
{
"document": "../../../../test_documents/vendored/docling/csv/csv-tab.csv",
"file_type": "csv",
"file_size": 997,
"expected_frameworks": ["kreuzberg", "docling", "markitdown", "pandoc", "tika", "unstructured"],
"metadata": {
"description": "Document from docling test suite",
"source": "docling",
"size_category": "small"
},
"ground_truth": {
"text_file": "../../../../test_documents/ground_truth/csv/csv-tab.txt",
"source": "pandoc",
"markdown_file": "../../../../test_documents/ground_truth/csv/csv-tab.md"
}
}

View File

@@ -0,0 +1,16 @@
{
"document": "../../../../test_documents/vendored/docling/csv/csv-too-few-columns.csv",
"file_type": "csv",
"file_size": 44,
"expected_frameworks": ["kreuzberg", "docling", "markitdown", "pandoc", "tika", "unstructured"],
"metadata": {
"description": "Document from docling test suite",
"source": "docling",
"size_category": "small"
},
"ground_truth": {
"text_file": "../../../../test_documents/ground_truth/csv/csv-too-few-columns.txt",
"source": "pandoc",
"markdown_file": "../../../../test_documents/ground_truth/csv/csv-too-few-columns.md"
}
}

View File

@@ -0,0 +1,16 @@
{
"document": "../../../../test_documents/vendored/docling/csv/csv-too-many-columns.csv",
"file_type": "csv",
"file_size": 46,
"expected_frameworks": ["kreuzberg", "docling", "markitdown", "pandoc", "tika", "unstructured"],
"metadata": {
"description": "Document from docling test suite",
"source": "docling",
"size_category": "small"
},
"ground_truth": {
"text_file": "../../../../test_documents/ground_truth/csv/csv-too-many-columns.txt",
"source": "pandoc",
"markdown_file": "../../../../test_documents/ground_truth/csv/csv-too-many-columns.md"
}
}

View File

@@ -0,0 +1,16 @@
{
"document": "../../../../test_documents/csv/data_table.csv",
"file_type": "csv",
"file_size": 476,
"expected_frameworks": ["kreuzberg"],
"metadata": {
"description": "csv test: data_table",
"source": "pandoc-generated",
"size_category": "small"
},
"ground_truth": {
"text_file": "../../../../test_documents/ground_truth/csv/data_table.txt",
"markdown_file": "../../../../test_documents/ground_truth/csv/data_table.md",
"source": "pandoc"
}
}

View File

@@ -0,0 +1,16 @@
{
"document": "../../../../test_documents/csv/stanley_cups.csv",
"file_type": "csv",
"file_size": 91,
"expected_frameworks": ["kreuzberg"],
"metadata": {
"description": "csv test: stanley_cups",
"source": "pandoc-generated",
"size_category": "small"
},
"ground_truth": {
"text_file": "../../../../test_documents/ground_truth/csv/stanley_cups.txt",
"markdown_file": "../../../../test_documents/ground_truth/csv/stanley_cups.md",
"source": "pandoc"
}
}

View File

@@ -0,0 +1,16 @@
{
"document": "../../../../test_documents/vendored/markitdown/csv/test_mskanji.csv",
"file_type": "csv",
"file_size": 70,
"expected_frameworks": ["kreuzberg", "docling", "markitdown", "pandoc", "tika", "unstructured"],
"metadata": {
"description": "Document from markitdown test suite",
"source": "markitdown",
"size_category": "small"
},
"ground_truth": {
"text_file": "../../../../test_documents/ground_truth/csv/test_mskanji.txt",
"source": "pandoc",
"markdown_file": "../../../../test_documents/ground_truth/csv/test_mskanji.md"
}
}