All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
DataExtractionModule.h
Go to the documentation of this file.
1 //---------------------------------------------------------------------------------------
2 // Copyright (c) 2001-2023 by Apryse Software Inc. All Rights Reserved.
3 // Consult legal.txt regarding legal and license information.
4 //---------------------------------------------------------------------------------------
5 // !Warning! This file is autogenerated, modify the .codegen file, not this one
6 // (any changes here will be wiped out during the autogen process)
7 
8 #ifndef PDFTRON_H_CPPPDFDataExtractionModule
9 #define PDFTRON_H_CPPPDFDataExtractionModule
10 #include <C/PDF/TRN_DataExtractionModule.h>
11 
13 #include <Common/BasicTypes.h>
14 #include <Common/UString.h>
15 #include <PDF/PDFDoc.h>
16 
17 namespace pdftron { namespace PDF {
18 
24 {
25 public:
26  /*
27  * Data Extraction Engines
28  */
33  e_Tabular = 0,
37  e_Form = 1,
46  };
47 
// Static query taking one DataExtractionEngine value and returning a bool.
// NOTE(review): judging by the name, `true` presumably means the add-on module
// backing `engine` can be used -- the implementation is not visible in this
// header (see Impl/DataExtractionModule.inl); confirm there.
54  static bool IsModuleAvailable(DataExtractionEngine engine);
55 
// ExtractData overload that hands its result back as a UString.
//   input_pdf_file - UString naming the input PDF (presumably a file path -- confirm).
//   engine         - which DataExtractionEngine to run.
//   options        - optional DataExtractionOptions pointer; defaults to 0 (null).
// NOTE(review): the sibling overload writes to `output_json_file`, so the returned
// string is presumably the same JSON content -- confirm against the implementation.
65  static UString ExtractData(const UString& input_pdf_file, DataExtractionEngine engine, DataExtractionOptions* options = 0);
66 
// ExtractData overload that returns nothing and instead takes an output name.
//   input_pdf_file   - UString naming the input PDF (presumably a file path -- confirm).
//   output_json_file - UString naming the output; the parameter name suggests a
//                      JSON file is written there -- confirm against the implementation.
//   engine           - which DataExtractionEngine to run.
//   options          - optional DataExtractionOptions pointer; defaults to 0 (null).
76  static void ExtractData(const UString& input_pdf_file, const UString& output_json_file, DataExtractionEngine engine, DataExtractionOptions* options = 0);
77 
// Static operation on an existing PDFDoc; returns nothing.
//   doc     - taken by non-const reference, so the callee is able to modify it.
//             NOTE(review): the name suggests detected form fields are added to
//             this document in place -- confirm against the implementation.
//   options - optional DataExtractionOptions pointer; defaults to 0 (null).
// Unlike the ExtractData overloads, no DataExtractionEngine argument is taken.
85  static void DetectAndAddFormFieldsToPDF(PDFDoc& doc, DataExtractionOptions* options = 0);
86 
// ExtractToXLSX overload whose output is identified by a UString name.
//   input_pdf_file   - UString naming the input PDF (presumably a file path -- confirm).
//   output_xlsx_file - UString naming the output; the parameter name suggests an
//                      XLSX file is written there -- confirm against the implementation.
//   options          - optional DataExtractionOptions pointer; defaults to 0 (null).
// No DataExtractionEngine argument is taken by this overload.
94  static void ExtractToXLSX(const UString& input_pdf_file, const UString& output_xlsx_file, DataExtractionOptions* options = 0);
95 
// ExtractToXLSX overload whose output goes to a Filters::Filter instead of a named file.
//   input_pdf_file     - UString naming the input PDF (presumably a file path -- confirm).
//   output_xlsx_stream - Filters::Filter taken by non-const reference; presumably the
//                        XLSX bytes are written into it -- confirm against the implementation.
//   options            - optional DataExtractionOptions pointer; defaults to 0 (null).
// NOTE(review): Filters::Filter is not included directly by this header; it is
// presumably reachable through <PDF/PDFDoc.h> -- verify.
103  static void ExtractToXLSX(const UString& input_pdf_file, Filters::Filter& output_xlsx_stream, DataExtractionOptions* options = 0);
104 
105 };
106 
107 #include <Impl/DataExtractionModule.inl>
108 } //end PDF
109 } //end pdftron
110 
111 
112 #endif //PDFTRON_H_CPPPDFDataExtractionModule
static bool IsModuleAvailable(DataExtractionEngine engine)
static UString ExtractData(const UString &input_pdf_file, DataExtractionEngine engine, DataExtractionOptions *options=0)
static void DetectAndAddFormFieldsToPDF(PDFDoc &doc, DataExtractionOptions *options=0)
static void ExtractToXLSX(const UString &input_pdf_file, const UString &output_xlsx_file, DataExtractionOptions *options=0)