changeset 9:bf19235a9636

fix minor bugs and add sample reports
author Dennis C. M. <dennis@denniscm.com>
date Wed, 07 Jun 2023 11:07:14 +0100
parents f2442b8f43de
children 2350662483a3
files analyze_document/app.py process_document/app.py reports/2022/acx_balance_1.pdf reports/2022/acx_balance_2.pdf reports/2022/acx_pnl_1.pdf reports/2022/itx_balance_1.pdf reports/2022/itx_pnl_1.pdf reports/2022/san_balance_1.pdf reports/2022/san_balance_2.pdf reports/2022/san_balance_3.pdf reports/2022/san_balance_4.pdf reports/2022/san_pnl_1.pdf reports/2022/san_pnl_2.pdf reports/itx_balance.pdf reports/san_balance.pdf
diffstat 15 files changed, 2 insertions(+), 2 deletions(-) [+]
line wrap: on
line diff
--- a/analyze_document/app.py	Mon Jun 05 20:07:22 2023 +0100
+++ b/analyze_document/app.py	Wed Jun 07 11:07:14 2023 +0100
@@ -14,7 +14,7 @@
     object_key = event_detail['object']['key']
 
     company_ticker = re.search('unprocessed/(.*)_', object_key).group(1)
-    doc_type = re.search(f'unprocessed/{company_ticker}_(.*).pdf', object_key).group(1)
+    doc_type = re.search(f'unprocessed/{company_ticker}_(.*)_', object_key).group(1)
     file_id = str(uuid.uuid4())
 
     data_dict = textract_client.analyze_document(
--- a/process_document/app.py	Mon Jun 05 20:07:22 2023 +0100
+++ b/process_document/app.py	Wed Jun 07 11:07:14 2023 +0100
@@ -152,7 +152,7 @@
     for amount_format in amount_formats:
         plural_amount_format = f'{amount_format}s'
 
-        if amount_format in phrase or plural_amount_format in phrase:
+        if amount_format in phrase.lower() or plural_amount_format in phrase.lower():
             return amount_format
 
 
Binary file reports/2022/acx_balance_1.pdf has changed
Binary file reports/2022/acx_balance_2.pdf has changed
Binary file reports/2022/acx_pnl_1.pdf has changed
Binary file reports/2022/itx_balance_1.pdf has changed
Binary file reports/2022/itx_pnl_1.pdf has changed
Binary file reports/2022/san_balance_1.pdf has changed
Binary file reports/2022/san_balance_2.pdf has changed
Binary file reports/2022/san_balance_3.pdf has changed
Binary file reports/2022/san_balance_4.pdf has changed
Binary file reports/2022/san_pnl_1.pdf has changed
Binary file reports/2022/san_pnl_2.pdf has changed
Binary file reports/itx_balance.pdf has changed
Binary file reports/san_balance.pdf has changed