From 341eb2db9a3af84ea85ebcb4a8a65fc48496c579 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Rafa=C5=82=20Mi=C5=82ecki?= Date: Sun, 19 Feb 2023 17:08:25 +0100 Subject: [PATCH] Provide Invoice2Data class for object oriented usage MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit This will allow using invoice2data in an object-oriented way like: import invoice2data i2d = invoice2data.Invoice2Data() i2d.extract_data("foo.pdf") Signed-off-by: Rafał Miłecki --- src/invoice2data/__init__.py | 1 + src/invoice2data/main.py | 13 +++++++++++++ 2 files changed, 14 insertions(+) diff --git a/src/invoice2data/__init__.py b/src/invoice2data/__init__.py index d6a0cc0d..3d88e595 100644 --- a/src/invoice2data/__init__.py +++ b/src/invoice2data/__init__.py @@ -1 +1,2 @@ from .main import extract_data # noqa: F401 +from .main import Invoice2Data # noqa: F401 diff --git a/src/invoice2data/main.py b/src/invoice2data/main.py index c322b179..2803fc49 100644 --- a/src/invoice2data/main.py +++ b/src/invoice2data/main.py @@ -37,6 +37,19 @@ output_mapping = {"csv": to_csv, "json": to_json, "xml": to_xml, "none": None} +class Invoice2Data: + def __init__(self, load_built_in_templates=True): + self.templates = [] + if load_built_in_templates: + self.templates += read_templates() + + def read_templates(self, path): + self.templates += read_templates(os.path.abspath(path)) + + def extract_data(self, path, input_module=None): + return extract_data(path, self.templates, input_module) + + def extract_data(invoicefile, templates=None, input_module=None): """Extracts structured data from PDF/image invoices.