This commit is contained in:
28
docs/snippets/c/getting-started/basic_usage.md
Normal file
28
docs/snippets/c/getting-started/basic_usage.md
Normal file
@@ -0,0 +1,28 @@
|
||||
```c title="C"
|
||||
#include <kreuzberg.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
|
||||
int main(void) {
|
||||
KREUZBERGExtractionConfig *config = kreuzberg_extraction_config_default();
|
||||
|
||||
KREUZBERGExtractionResult *result =
|
||||
kreuzberg_extract_file("document.pdf", NULL, config);
|
||||
if (!result) {
|
||||
fprintf(stderr, "extraction failed (code %d): %s\n",
|
||||
kreuzberg_last_error_code(),
|
||||
kreuzberg_last_error_context());
|
||||
kreuzberg_extraction_config_free(config);
|
||||
return 1;
|
||||
}
|
||||
|
||||
char *content = kreuzberg_extraction_result_content(result);
|
||||
printf("%s\n", content ? content : "(empty)");
|
||||
kreuzberg_free_string(content);
|
||||
|
||||
kreuzberg_extraction_result_free(result);
|
||||
kreuzberg_extraction_config_free(config);
|
||||
return 0;
|
||||
}
|
||||
```
|
||||
39
docs/snippets/c/getting-started/extract_file.md
Normal file
39
docs/snippets/c/getting-started/extract_file.md
Normal file
@@ -0,0 +1,39 @@
|
||||
```c title="C"
|
||||
#include <kreuzberg.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
|
||||
int main(void) {
|
||||
KREUZBERGExtractionResult *result =
|
||||
kreuzberg_extract_file("document.pdf", NULL, NULL);
|
||||
if (!result) {
|
||||
fprintf(stderr, "extraction failed (code %d): %s\n",
|
||||
kreuzberg_last_error_code(),
|
||||
kreuzberg_last_error_context());
|
||||
return 1;
|
||||
}
|
||||
|
||||
char *content = kreuzberg_extraction_result_content(result);
|
||||
printf("content:\n%s\n", content ? content : "(empty)");
|
||||
kreuzberg_free_string(content);
|
||||
|
||||
char *tables_json = kreuzberg_extraction_result_tables(result);
|
||||
printf("tables (JSON): %s\n", tables_json ? tables_json : "[]");
|
||||
kreuzberg_free_string(tables_json);
|
||||
|
||||
KREUZBERGMetadata *metadata = kreuzberg_extraction_result_metadata(result);
|
||||
if (metadata) {
|
||||
char *title = kreuzberg_metadata_title(metadata);
|
||||
char *language = kreuzberg_metadata_language(metadata);
|
||||
printf("title: %s\n", title ? title : "(none)");
|
||||
printf("language: %s\n", language ? language : "(none)");
|
||||
kreuzberg_free_string(title);
|
||||
kreuzberg_free_string(language);
|
||||
kreuzberg_metadata_free(metadata);
|
||||
}
|
||||
|
||||
kreuzberg_extraction_result_free(result);
|
||||
return 0;
|
||||
}
|
||||
```
|
||||
46
docs/snippets/c/getting-started/extract_with_ocr.md
Normal file
46
docs/snippets/c/getting-started/extract_with_ocr.md
Normal file
@@ -0,0 +1,46 @@
|
||||
```c title="C"
|
||||
#include <kreuzberg.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
|
||||
int main(void) {
|
||||
const char *config_json =
|
||||
"{"
|
||||
"\"force_ocr\": true,"
|
||||
"\"ocr\": {\"backend\": \"tesseract\", \"language\": \"eng\"}"
|
||||
"}";
|
||||
|
||||
KREUZBERGExtractionConfig *config =
|
||||
kreuzberg_extraction_config_from_json(config_json);
|
||||
if (!config) {
|
||||
fprintf(stderr, "config init failed (code %d): %s\n",
|
||||
kreuzberg_last_error_code(),
|
||||
kreuzberg_last_error_context());
|
||||
return 1;
|
||||
}
|
||||
|
||||
KREUZBERGExtractionResult *result =
|
||||
kreuzberg_extract_file("scanned.pdf", NULL, config);
|
||||
if (!result) {
|
||||
fprintf(stderr, "extraction failed (code %d): %s\n",
|
||||
kreuzberg_last_error_code(),
|
||||
kreuzberg_last_error_context());
|
||||
kreuzberg_extraction_config_free(config);
|
||||
return 1;
|
||||
}
|
||||
|
||||
char *content = kreuzberg_extraction_result_content(result);
|
||||
printf("%s\n", content ? content : "(empty)");
|
||||
kreuzberg_free_string(content);
|
||||
|
||||
char *detected_languages = kreuzberg_extraction_result_detected_languages(result);
|
||||
printf("detected languages: %s\n",
|
||||
detected_languages ? detected_languages : "(none)");
|
||||
kreuzberg_free_string(detected_languages);
|
||||
|
||||
kreuzberg_extraction_result_free(result);
|
||||
kreuzberg_extraction_config_free(config);
|
||||
return 0;
|
||||
}
|
||||
```
|
||||
24
docs/snippets/c/getting-started/hello_world.md
Normal file
24
docs/snippets/c/getting-started/hello_world.md
Normal file
@@ -0,0 +1,24 @@
|
||||
```c title="C"
|
||||
#include <kreuzberg.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
|
||||
int main(void) {
|
||||
KREUZBERGExtractionResult *result =
|
||||
kreuzberg_extract_file("document.pdf", NULL, NULL);
|
||||
if (!result) {
|
||||
fprintf(stderr, "extraction failed (code %d): %s\n",
|
||||
kreuzberg_last_error_code(),
|
||||
kreuzberg_last_error_context());
|
||||
return 1;
|
||||
}
|
||||
|
||||
char *content = kreuzberg_extraction_result_content(result);
|
||||
printf("%s\n", content ? content : "(empty)");
|
||||
kreuzberg_free_string(content);
|
||||
|
||||
kreuzberg_extraction_result_free(result);
|
||||
return 0;
|
||||
}
|
||||
```
|
||||
12
docs/snippets/c/getting-started/install_verify.md
Normal file
12
docs/snippets/c/getting-started/install_verify.md
Normal file
@@ -0,0 +1,12 @@
|
||||
```c title="C"
|
||||
#include <kreuzberg.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
|
||||
int main(void) {
|
||||
const char *version = kreuzberg_version();
|
||||
printf("kreuzberg version: %s\n", version ? version : "(unknown)");
|
||||
return 0;
|
||||
}
|
||||
```
|
||||
38
docs/snippets/c/getting-started/read_content.md
Normal file
38
docs/snippets/c/getting-started/read_content.md
Normal file
@@ -0,0 +1,38 @@
|
||||
```c title="C"
|
||||
#include <kreuzberg.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
|
||||
int main(void) {
|
||||
KREUZBERGExtractionResult *result =
|
||||
kreuzberg_extract_file("document.pdf", NULL, NULL);
|
||||
if (!result) {
|
||||
fprintf(stderr, "extraction failed (code %d): %s\n",
|
||||
kreuzberg_last_error_code(),
|
||||
kreuzberg_last_error_context());
|
||||
return 1;
|
||||
}
|
||||
|
||||
char *content = kreuzberg_extraction_result_content(result);
|
||||
if (content) {
|
||||
printf("content length: %zu bytes\n", strlen(content));
|
||||
printf("%s\n", content);
|
||||
}
|
||||
kreuzberg_free_string(content);
|
||||
|
||||
/* Tables are returned as a JSON array string. A real consumer would
|
||||
* feed this into a JSON parser and walk each table's grid. */
|
||||
char *tables_json = kreuzberg_extraction_result_tables(result);
|
||||
if (tables_json) {
|
||||
printf("tables JSON (%zu bytes):\n%s\n",
|
||||
strlen(tables_json), tables_json);
|
||||
} else {
|
||||
printf("tables JSON: (none)\n");
|
||||
}
|
||||
kreuzberg_free_string(tables_json);
|
||||
|
||||
kreuzberg_extraction_result_free(result);
|
||||
return 0;
|
||||
}
|
||||
```
|
||||
Reference in New Issue
Block a user