diff --git a/python/Textract-Table-Merged-Cells-And-Headers.ipynb b/python/Textract-Table-Merged-Cells-And-Headers.ipynb index 6002ca2..3ff7ee5 100644 --- a/python/Textract-Table-Merged-Cells-And-Headers.ipynb +++ b/python/Textract-Table-Merged-Cells-And-Headers.ipynb @@ -15,8 +15,10 @@ "source": [ "We will be using the modules below:\n", "* amazon-textract-caller (https://pypi.org/project/amazon-textract-caller/) to invoke Amazon Textract API on our behalf\n", - "* amazon-textract-response-parser (http://%28https//pypi.org/project/amazon-textract-response-parser/) to parse the response payload\n", - "* amazoon-textract-prettyprinter (https://pypi.org/project/amazon-textract-prettyprinter/) to \"pretty-print\" tables" + "* amazon-textract-response-parser (https://pypi.org/project/amazon-textract-response-parser/) to parse the response payload\n", + "* amazon-textract-prettyprinter (https://pypi.org/project/amazon-textract-prettyprinter/) to \"pretty-print\" tables\n", + "\n", + "The code can be run using Python 3.7 or newer." ] }, { @@ -28,8 +30,7 @@ "source": [ "!pip install boto3\n", "!pip install amazon-textract-caller\n", - "!pip install amazon-textract-prettyprinter\n", - "!pip install trp" + "!pip install amazon-textract-prettyprinter" ] }, { @@ -117,7 +118,7 @@ "for page in trp_doc.pages:\n", " for table in page.tables:\n", " table_data = []\n", - " headers = table.get_header_field_names()\n", + " headers = []\n", " if(len(headers)>0): #Let's retain the only table with headers\n", " print(\"Statememt headers: \"+ repr(headers))\n", " top_header= headers[0]\n",