
Commit 8cd475f

Remove pandas dependency in minimal requirements

1 parent 99e019f · commit 8cd475f

24 files changed: +486 -213 lines changed

MANIFEST.in (+3)

@@ -0,0 +1,3 @@
+include *.txt
+recursive-include extras *.txt
+recursive-include textractor *

NOTICE (+1 -1)

@@ -1,2 +1,2 @@
 Amazon Textract Textractor
-Copyright 2019 Amazon.com, Inc. or its affiliates. All Rights Reserved.
+Copyright 2022 Amazon.com, Inc. or its affiliates. All Rights Reserved.

README.md (+6 -5)

@@ -14,13 +14,14 @@ If you are looking for the other amazon-textract-* packages, you can find them u
 
 ## Installation
 
-Textractor is available on PyPI and can be installed with `pip install amazon-textract-textractor`. By default this will install the minimal version of textractor. The following extras can be used to add features:
+Textractor is available on PyPI and can be installed with `pip install amazon-textract-textractor`. By default this will install the minimal version of Textractor which is suitable for lambda execution. The following extras can be used to add features:
 
-- `pdf` (`pip install amazon-textract-textractor[pdf]`) includes `pdf2image` and enables PDF rasterization in Textractor. Note that this is **not** necessary to call Textract with a PDF file.
-- `torch` (`pip install amazon-textract-textractor[torch]`) includes `sentence_transformers` for better word search and matching. This will work on CPU but be noticeably slower than non-machine learning based approaches.
-- `dev` (`pip install amazon-textract-textractor[dev]`) includes all the dependencies above and everything else needed to test the code.
+- `pandas` (`pip install "amazon-textract-textractor[pandas]"`) installs pandas which is used to enable DataFrame and CSV exports.
+- `pdf` (`pip install "amazon-textract-textractor[pdf]"`) includes `pdf2image` and enables PDF rasterization in Textractor. Note that this is **not** necessary to call Textract with a PDF file.
+- `torch` (`pip install "amazon-textract-textractor[torch]"`) includes `sentence_transformers` for better word search and matching. This will work on CPU but be noticeably slower than non-machine learning based approaches.
+- `dev` (`pip install "amazon-textract-textractor[dev]"`) includes all the dependencies above and everything else needed to test the code.
 
-You can pick several extras by separating the labels with commas like this `pip install amazon-textract-textractor[pdf,torch]`.
+You can pick several extras by separating the labels with commas like this `pip install "amazon-textract-textractor[pdf,torch]"`.
 
 
 ## Documentation

docs/source/notebooks/imgs/excel.png

401 KB

docs/source/notebooks/table_data_to_various_formats.ipynb (+73 -11)

Large diffs are not rendered by default.
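The notebook update above walks through exporting recognized table data, which is what the new `pandas` extra enables. A minimal sketch of that workflow, assuming a saved Textract response and that tables expose `to_pandas()`/`to_csv()` helpers (names inferred from the notebook topic, not shown in this diff):

```python
# Sketch only: requires the optional pandas extra
# (pip install "amazon-textract-textractor[pandas]").
from textractor.entities.document import Document

# "response.json" is a hypothetical saved AnalyzeDocument response with TABLES enabled.
document = Document.open("response.json")

for i, table in enumerate(document.tables):
    df = table.to_pandas()  # assumed helper returning a pandas DataFrame
    df.to_csv(f"table_{i}.csv", index=False)
    print(df.head())
```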

extras/pandas.txt (+2)

@@ -0,0 +1,2 @@
+numpy==1.21.*
+pandas

requirements.txt (-2)

@@ -1,12 +1,10 @@
-numpy==1.21.*
 awscli
 amazon-textract-response-parser==0.1.33
 amazon-textract-caller==0.0.24
 boto3==1.24.*
 botocore==1.27.90
 jsonschema
 Pillow
-pandas
 tabulate==0.8.10
 XlsxWriter==3.0.3
 pyxDamerauLevenshtein==1.7.1

setup.py (+1 -1)

@@ -16,7 +16,7 @@ def read_requirements(path):
 setup(
     # include data files
     name="amazon-textract-textractor",
-    version="1.0.5",
+    version="1.0.6",
     description="A package to use AWS Textract services.",
     long_description=long_description,
     long_description_content_type="text/markdown",
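The `read_requirements` helper visible in the hunk header is presumably how the new `extras/pandas.txt` file gets mapped to a pip extra; the actual `extras_require` block is outside this hunk. A hedged sketch of what that wiring could look like (the other extras files are assumptions):

```python
# Hypothetical wiring of extras/*.txt into extras_require; the real setup.py may differ.
from setuptools import setup


def read_requirements(path):
    """Read one requirement per line, skipping blanks and comments."""
    with open(path) as f:
        return [line.strip() for line in f if line.strip() and not line.startswith("#")]


setup(
    name="amazon-textract-textractor",
    version="1.0.6",
    install_requires=read_requirements("requirements.txt"),
    extras_require={
        "pandas": read_requirements("extras/pandas.txt"),  # added in this commit
        "pdf": read_requirements("extras/pdf.txt"),        # assumed pre-existing extras files
        "torch": read_requirements("extras/torch.txt"),
        "dev": read_requirements("extras/dev.txt"),
    },
)
```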

textractor/cli/cli.py (+212 -64)

Large diffs are not rendered by default.

textractor/data/constants.py (+2)

@@ -209,6 +209,7 @@ class AnalyzeIDFields(Enum):
     # Only available in passports
     PLACE_OF_BIRTH = "PLACE_OF_BIRTH"
 
+
 class CLIPrint(Enum):
     ALL = 0
     TEXT = 1
@@ -218,6 +219,7 @@ class CLIPrint(Enum):
     EXPENSES = 5
     IDS = 6
 
+
 class CLIOverlay(Enum):
     ALL = 0
     WORDS = 1

textractor/entities/bbox.py (+7 -1)

@@ -3,7 +3,13 @@
 
 from abc import ABC
 from typing import Tuple
-import numpy as np
+
+try:
+    import numpy as np
+except ImportError:
+    # Used in an export_as_numpy function which won't be called if the user doesn't have numpy.
+    pass
+
 from typing import Dict
 from dataclasses import dataclass
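The guarded import above is what lets the minimal install drop numpy: the module still loads, and only a numpy-dependent export path would fail. A generic sketch of the pattern (illustrative only, not the actual `export_as_numpy` implementation, which is outside this hunk):

```python
# Generic optional-dependency pattern; illustrative, not the real bbox.py code.
try:
    import numpy as np
    _HAS_NUMPY = True
except ImportError:
    _HAS_NUMPY = False  # numpy is only needed when exporting as an array


def export_as_numpy(x: float, y: float, width: float, height: float):
    """Return the bounding box as a numpy array; needs the optional numpy dependency."""
    if not _HAS_NUMPY:
        raise ImportError("numpy is required for export_as_numpy(); install numpy to use it.")
    return np.array([x, y, width, height])
```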

textractor/entities/document.py (+29 -26)

@@ -46,7 +46,7 @@ class Document(SpatialObject):
     """
 
     @classmethod
-    def open(self, fp: Union[dict, str, IO[AnyStr]]):
+    def open(cls, fp: Union[dict, str, IO[AnyStr]]):
         """Create a Document object from a JSON file path, file handle or response dictionary
 
         :param fp: _description_
@@ -297,13 +297,12 @@ def filter_checkboxes(
         :return: Returns checkboxes that match the conditions set by the flags.
         :rtype: EntityList[KeyValue]
         """
-
+
         checkboxes = EntityList([])
         for page in self.pages:
-            checkboxes.extend(page.filter_checkboxes(
-                selected=selected,
-                not_selected=not_selected
-            ))
+            checkboxes.extend(
+                page.filter_checkboxes(selected=selected, not_selected=not_selected)
+            )
         return checkboxes
 
     def get_words_by_type(self, text_type: TextTypes = TextTypes.PRINTED) -> List[Word]:
@@ -328,7 +327,7 @@ def search_words(
         self,
         keyword: str,
         top_k: int = 1,
-        similarity_metric: SimilarityMetric= SimilarityMetric.LEVENSHTEIN,
+        similarity_metric: SimilarityMetric = SimilarityMetric.LEVENSHTEIN,
         similarity_threshold: float = 0.6,
     ) -> List[Word]:
         """
@@ -350,12 +349,14 @@ def search_words(
 
         top_n_words = []
         for page in self.pages:
-            top_n_words.extend(page._search_words_with_similarity(
-                keyword=keyword,
-                top_k=top_k,
-                similarity_metric=similarity_metric,
-                similarity_threshold=similarity_threshold,
-            ))
+            top_n_words.extend(
+                page._search_words_with_similarity(
+                    keyword=keyword,
+                    top_k=top_k,
+                    similarity_metric=similarity_metric,
+                    similarity_threshold=similarity_threshold,
+                )
+            )
 
         top_n_words = sorted(top_n_words, key=lambda x: x[0], reverse=True)[:top_k]
         top_n_words = EntityList([ent[1] for ent in top_n_words])
@@ -366,7 +367,7 @@ def search_lines(
         self,
         keyword: str,
         top_k: int = 1,
-        similarity_metric: SimilarityMetric= SimilarityMetric.LEVENSHTEIN,
+        similarity_metric: SimilarityMetric = SimilarityMetric.LEVENSHTEIN,
         similarity_threshold: float = 0.6,
     ) -> List[Line]:
         """
@@ -392,12 +393,14 @@ def search_lines(
 
         top_n_lines = []
         for page in self.pages:
-            top_n_lines.extend(page._search_lines_with_similarity(
-                keyword=keyword,
-                top_k=top_k,
-                similarity_metric=similarity_metric,
-                similarity_threshold=similarity_threshold,
-            ))
+            top_n_lines.extend(
+                page._search_lines_with_similarity(
+                    keyword=keyword,
+                    top_k=top_k,
+                    similarity_metric=similarity_metric,
+                    similarity_threshold=similarity_threshold,
+                )
+            )
 
         top_n_lines = EntityList([ent[1] for ent in top_n_lines][:top_k])
 
@@ -408,7 +411,7 @@ def get_value_by_key(
         self,
         key: str,
         top_k_matches: int = 1,
-        similarity_metric: SimilarityMetric= SimilarityMetric.LEVENSHTEIN,
+        similarity_metric: SimilarityMetric = SimilarityMetric.LEVENSHTEIN,
         similarity_threshold: float = 0.6,
     ):
         """
@@ -457,7 +460,9 @@ def get_value_by_key(
                 for word in edited_document_key.split(" ")
             ]
             similarity.append(
-                SearchUtils.get_word_similarity(key, edited_document_key, similarity_metric)
+                SearchUtils.get_word_similarity(
+                    key, edited_document_key, similarity_metric
+                )
             )
 
         similarity = (
@@ -612,11 +617,9 @@ def return_duplicates(self):
         :rtype: Dict[page_num, List[EntityList[DocumentEntity]]]
         """
         document_duplicates = defaultdict(list)
-
+
         for page in self.pages:
-            document_duplicates[
-                page.page_num
-            ].extend(page.return_duplicates())
+            document_duplicates[page.page_num].extend(page.return_duplicates())
 
         return document_duplicates
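With `open` now taking `cls` as its first argument it behaves as a proper classmethod, and the reformatted search helpers keep the same signatures. A usage sketch based on the signatures in this diff (the file path and import paths are assumptions):

```python
from textractor.entities.document import Document
from textractor.data.constants import SimilarityMetric  # assumed import path

# Hypothetical saved Textract response.
document = Document.open("analyze_document_response.json")

# Fuzzy word search with the defaults shown above (Levenshtein, threshold 0.6).
matches = document.search_words(
    keyword="Total",
    top_k=5,
    similarity_metric=SimilarityMetric.LEVENSHTEIN,
    similarity_threshold=0.6,
)

# Checkbox filtering is aggregated across all pages in a single call.
selected_boxes = document.filter_checkboxes(selected=True, not_selected=False)
```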

textractor/entities/expense_document.py (+3 -1)

@@ -96,4 +96,6 @@ def keys(self) -> List[str]:
         return self._summary_fields.keys()
 
     def __repr__(self) -> str:
-        return os.linesep.join([f"{str(k)}: {str(v)}" for k, v in self._summary_fields.items()])
+        return os.linesep.join(
+            [f"{str(k)}: {str(v)}" for k, v in self._summary_fields.items()]
+        )

textractor/entities/identity_field.py (+1 -1)

@@ -15,6 +15,6 @@ def value(self) -> str:
     @property
     def confidence(self) -> float:
         return self._confidence
-
+
     def __repr__(self) -> str:
         return self.value

textractor/entities/key_value.py (+6 -2)

@@ -183,10 +183,14 @@ def is_selected(self) -> bool:
             if len(self.value.children) == 1:
                 return self.value.children[0].is_selected()
             else:
-                logging.info("is_checked() was called on a KeyValue that contains more than one checkbox. Returning first checkbox")
+                logging.info(
+                    "is_checked() was called on a KeyValue that contains more than one checkbox. Returning first checkbox"
+                )
                 return self.value.children[0].is_selected()
         else:
-            logging.info("is_checked() was called on a KeyValue that does not contain checkboxes. Returning False")
+            logging.info(
+                "is_checked() was called on a KeyValue that does not contain checkboxes. Returning False"
+            )
             return False
 
     def __repr__(self) -> str:

textractor/entities/page.py (+37 -27)

@@ -315,7 +315,7 @@ def _search_words_with_similarity(
         self,
         keyword: str,
         top_k: int = 1,
-        similarity_metric: SimilarityMetric= SimilarityMetric.LEVENSHTEIN,
+        similarity_metric: SimilarityMetric = SimilarityMetric.LEVENSHTEIN,
         similarity_threshold: float = 0.6,
     ) -> List[Tuple[Word, float]]:
         """
@@ -346,7 +346,9 @@ def _search_words_with_similarity(
         lowest_similarity = similarity_threshold
 
         for word in self.words:
-            similarity = SearchUtils.get_word_similarity(keyword, word.text, similarity_metric)
+            similarity = SearchUtils.get_word_similarity(
+                keyword, word.text, similarity_metric
+            )
             similarity = (
                 similarity
                 if similarity_metric == SimilarityMetric.COSINE
@@ -361,14 +363,14 @@ def _search_words_with_similarity(
                 continue
             top_n_words = sorted(top_n_words, key=lambda x: x[0], reverse=True)
             lowest_similarity = top_n_words[-1][0]
-
+
         return top_n_words
 
     def search_words(
         self,
         keyword: str,
         top_k: int = 1,
-        similarity_metric: SimilarityMetric= SimilarityMetric.LEVENSHTEIN,
+        similarity_metric: SimilarityMetric = SimilarityMetric.LEVENSHTEIN,
         similarity_threshold: float = 0.6,
     ) -> EntityList[Word]:
         """
@@ -387,23 +389,25 @@ def search_words(
         :rtype: EntityList[Word]
         """
 
-        top_n_words = EntityList([
-            ent[1]
-            for ent in self._search_words_with_similarity(
-                keyword=keyword,
-                top_k=top_k,
-                similarity_metric=similarity_metric,
-                similarity_threshold=similarity_threshold,
-            )
-        ])
+        top_n_words = EntityList(
+            [
+                ent[1]
+                for ent in self._search_words_with_similarity(
+                    keyword=keyword,
+                    top_k=top_k,
+                    similarity_metric=similarity_metric,
+                    similarity_threshold=similarity_threshold,
+                )
+            ]
+        )
 
         return top_n_words
 
     def _search_lines_with_similarity(
         self,
         keyword: str,
         top_k: int = 1,
-        similarity_metric: SimilarityMetric= SimilarityMetric.LEVENSHTEIN,
+        similarity_metric: SimilarityMetric = SimilarityMetric.LEVENSHTEIN,
         similarity_threshold: int = 0.6,
     ) -> List[Tuple[Line, float]]:
         """
@@ -441,7 +445,9 @@ def _search_lines_with_similarity(
                 for word in line.__repr__().split(" ")
             ]
             similarity.append(
-                SearchUtils.get_word_similarity(keyword, line.__repr__(), similarity_metric)
+                SearchUtils.get_word_similarity(
+                    keyword, line.__repr__(), similarity_metric
+                )
             )
             similarity = (
                 max(similarity)
@@ -464,7 +470,7 @@ def search_lines(
         self,
         keyword: str,
         top_k: int = 1,
-        similarity_metric: SimilarityMetric= SimilarityMetric.LEVENSHTEIN,
+        similarity_metric: SimilarityMetric = SimilarityMetric.LEVENSHTEIN,
         similarity_threshold: int = 0.6,
     ) -> EntityList[Line]:
         """
@@ -484,15 +490,17 @@ def search_lines(
         :rtype: EntityList[Line]
         """
 
-        top_n_lines = EntityList([
-            ent[1]
-            for ent in self._search_lines_with_similarity(
-                keyword=keyword,
-                top_k=top_k,
-                similarity_metric=similarity_metric,
-                similarity_threshold=similarity_threshold,
-            )
-        ])
+        top_n_lines = EntityList(
+            [
+                ent[1]
+                for ent in self._search_lines_with_similarity(
+                    keyword=keyword,
+                    top_k=top_k,
+                    similarity_metric=similarity_metric,
+                    similarity_threshold=similarity_threshold,
+                )
+            ]
+        )
 
         return top_n_lines
 
@@ -501,7 +509,7 @@ def get_value_by_key(
         self,
         key: str,
         top_k_matches: int = 1,
-        similarity_metric: SimilarityMetric= SimilarityMetric.LEVENSHTEIN,
+        similarity_metric: SimilarityMetric = SimilarityMetric.LEVENSHTEIN,
         similarity_threshold: float = 0.6,
     ) -> EntityList[KeyValue]:
         """
@@ -551,7 +559,9 @@ def get_value_by_key(
                 for word in edited_document_key.split(" ")
             ]
             similarity.append(
-                SearchUtils.get_word_similarity(key, edited_document_key, similarity_metric)
+                SearchUtils.get_word_similarity(
+                    key, edited_document_key, similarity_metric
+                )
            )
 
         similarity = (
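The page-level helpers mirror the document-level ones, including `get_value_by_key`, which these hunks only reformat. A short hedged example of that key-value lookup (file path, key text, and attribute access are illustrative):

```python
from textractor.entities.document import Document
from textractor.data.constants import SimilarityMetric  # assumed import path

document = Document.open("analyze_document_response.json")  # hypothetical saved response
page = document.pages[0]

# Illustrative key-value lookup using the signature shown above; the key text is made up.
kv_matches = page.get_value_by_key(
    key="Date of Birth",
    top_k_matches=1,
    similarity_metric=SimilarityMetric.LEVENSHTEIN,
)
for kv in kv_matches:
    print(kv.key, "->", kv.value)
```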
