diff analyze_document/app.py @ 10:2350662483a3

fix minor bugs
author Dennis C. M. <dennis@denniscm.com>
date Thu, 08 Jun 2023 17:16:36 +0100
parents bf19235a9636
children
line wrap: on
line diff
--- a/analyze_document/app.py	Wed Jun 07 11:07:14 2023 +0100
+++ b/analyze_document/app.py	Thu Jun 08 17:16:36 2023 +0100
@@ -13,8 +13,8 @@
     bucket_name = event_detail['bucket']['name']
     object_key = event_detail['object']['key']
 
-    company_ticker = re.search('unprocessed/(.*)_', object_key).group(1)
-    doc_type = re.search(f'unprocessed/{company_ticker}_(.*)_', object_key).group(1)
+    company_ticker = re.search('unprocessed/(.*?)_', object_key).group(1)
+    doc_type = re.search(f'unprocessed/{company_ticker}_(.*?)_', object_key).group(1)
     file_id = str(uuid.uuid4())
 
     data_dict = textract_client.analyze_document(