23 lines
513 B
JSON
23 lines
513 B
JSON
|
|
{
|
||
|
|
"document": "../../../test_documents/images_extra/ocr_image.tiff",
|
||
|
|
"file_type": "tiff",
|
||
|
|
"file_size": 367848,
|
||
|
|
"expected_frameworks": [
|
||
|
|
"kreuzberg",
|
||
|
|
"docling",
|
||
|
|
"markitdown",
|
||
|
|
"pymupdf4llm",
|
||
|
|
"tika",
|
||
|
|
"unstructured"
|
||
|
|
],
|
||
|
|
"metadata": {
|
||
|
|
"description": "TIFF image with text for OCR testing",
|
||
|
|
"category": "image",
|
||
|
|
"requires_ocr": true
|
||
|
|
},
|
||
|
|
"ground_truth": {
|
||
|
|
"text_file": "../../../test_documents/ground_truth/tiff/image_tiff.md",
|
||
|
|
"source": "mistral-pixtral"
|
||
|
|
}
|
||
|
|
}
|