Loading...
Searching...
No Matches
DataExtractionModule.h
Go to the documentation of this file.
1//---------------------------------------------------------------------------------------
2// Copyright (c) 2001-2025 by Apryse Software Inc. All Rights Reserved.
3// Consult legal.txt regarding legal and license information.
4//---------------------------------------------------------------------------------------
5// !Warning! This file is autogenerated, modify the .codegen file, not this one
6// (any changes here will be wiped out during the autogen process)
7
8#ifndef PDFTRON_H_CPPPDFDataExtractionModule
9#define PDFTRON_H_CPPPDFDataExtractionModule
10#include <C/PDF/TRN_DataExtractionModule.h>
11
13#include <Common/BasicTypes.h>
14#include <Common/UString.h>
15#include <PDF/PDFDoc.h>
16
17namespace pdftron { namespace PDF {
18
24{
25public:
38
46
// Static overload of ExtractData that hands its result back as a UString
// instead of taking an output-file argument.
//   input_pdf_file - UString naming the input PDF (passed by const reference).
//   engine         - DataExtractionEngine value selecting which engine to run.
//   options        - optional DataExtractionOptions pointer; defaults to 0.
// NOTE(review): the returned string presumably carries the extraction result as
// JSON (the sibling overload writes to `output_json_file`) — confirm.
56 static UString ExtractData(const UString& input_pdf_file, DataExtractionEngine engine, DataExtractionOptions* options = 0);
57
// Static overload of ExtractData that takes an explicit output argument and
// returns nothing.
//   input_pdf_file   - UString naming the input PDF (passed by const reference).
//   output_json_file - UString naming the output; presumably a path to a JSON
//                      file that receives the result — confirm.
//   engine           - DataExtractionEngine value selecting which engine to run.
//   options          - optional DataExtractionOptions pointer; defaults to 0.
67 static void ExtractData(const UString& input_pdf_file, const UString& output_json_file, DataExtractionEngine engine, DataExtractionOptions* options = 0);
68
77
// Static overload of ExtractToXLSX whose output is named by a UString.
// Unlike ExtractData, no DataExtractionEngine argument is taken.
//   input_pdf_file   - UString naming the input PDF (passed by const reference).
//   output_xlsx_file - UString naming the output; presumably a path to the
//                      XLSX file to be written — confirm.
//   options          - optional DataExtractionOptions pointer; defaults to 0.
85 static void ExtractToXLSX(const UString& input_pdf_file, const UString& output_xlsx_file, DataExtractionOptions* options = 0);
86
// Static overload of ExtractToXLSX whose output goes to a Filters::Filter
// passed by non-const reference, rather than to a named file.
//   input_pdf_file     - UString naming the input PDF (passed by const reference).
//   output_xlsx_stream - Filters::Filter the caller supplies; presumably the
//                        XLSX bytes are written into it — confirm.
//   options            - optional DataExtractionOptions pointer; defaults to 0.
// NOTE(review): no Filters header is included directly in the visible listing;
// Filters::Filter presumably arrives transitively (e.g. via PDF/PDFDoc.h) — confirm.
94 static void ExtractToXLSX(const UString& input_pdf_file, Filters::Filter& output_xlsx_stream, DataExtractionOptions* options = 0);
95
96};
97
98#include <Impl/DataExtractionModule.inl>
99} //end PDF
100} //end pdftron
101
102
103#endif //PDFTRON_H_CPPPDFDataExtractionModule
static bool IsModuleAvailable(DataExtractionEngine engine)
static void ExtractData(const UString &input_pdf_file, const UString &output_json_file, DataExtractionEngine engine, DataExtractionOptions *options=0)
static void ExtractToXLSX(const UString &input_pdf_file, const UString &output_xlsx_file, DataExtractionOptions *options=0)
static UString ExtractData(const UString &input_pdf_file, DataExtractionEngine engine, DataExtractionOptions *options=0)
static void DetectAndAddFormFieldsToPDF(PDFDoc &doc, DataExtractionOptions *options=0)
@ e_Form
Form field extraction engine. This engine uses artificial intelligence and computer vision to detect ...
@ e_DocClassification
Document classification engine. This engine uses artificial intelligence to assign predefined categor...
@ e_DocStructure
Document structure engine. This engine discovers the full logical structure, including headers,...
@ e_GenericKeyValue
Generic key value extraction engine. This engine uses artificial intelligence to detect arbitrary pai...
@ e_Tabular
Tabular Data engine. This engine identifies column and row structure and analyzes numeric columns....
@ e_FormKeyValue
Form field with key value extraction engine. This engine uses artificial intelligence and computer vi...
static void ExtractToXLSX(const UString &input_pdf_file, Filters::Filter &output_xlsx_stream, DataExtractionOptions *options=0)