diff --git a/deployment/lambda/extractor_and_loader/docker/app.py b/deployment/lambda/extractor_and_loader/docker/app.py index 929c16a..510af31 100644 --- a/deployment/lambda/extractor_and_loader/docker/app.py +++ b/deployment/lambda/extractor_and_loader/docker/app.py @@ -199,7 +199,7 @@ def handler(event, context): local_path = download_private_s3_file(file_uri) print("Extracting file...") - reader = pdfReaderToText(local_path) + reader = pdfReaderToText(local_path, logger=False) obj = WarmHomesConditionReport(reader.text_list) json_ = make_final_json(obj.master_obj[0], obj.master_obj[1]) print("Extracted completed, made json") diff --git a/etl/fileReader/pdfReaderToText.py b/etl/fileReader/pdfReaderToText.py index c1d5834..a4d11a4 100644 --- a/etl/fileReader/pdfReaderToText.py +++ b/etl/fileReader/pdfReaderToText.py @@ -15,9 +15,10 @@ from pprint import pprint class pdfReaderToText(): - def __init__(self, file_path): + def __init__(self, file_path, logger=True): self.source_path = file_path - self.logger = Logger(name='pdfReader', level=logging.INFO).get_logger() + if logger: + self.logger = Logger(name='pdfReader', level=logging.INFO).get_logger() self.all_text = "" self.text_list = [] self.get_text_from_pdf_file()