From a4e916d68c869bf7b5147f1e5a75ecb141174913 Mon Sep 17 00:00:00 2001
From: Jun-te Kim
Date: Wed, 12 Mar 2025 14:57:39 +0000
Subject: [PATCH] q16

---
Notes (review commentary; text in this area is not part of the commit):

    What the patch does
      * Hunk 1 adds two calls, self.get_section_15_1() and
        self.get_section_16(), directly after self.get_section_15_0().
      * Hunk 2 adds the two methods those calls refer to.

    get_section_15_1
      * Takes the part of self.raw_data that starts at
        "15.1 Hot Water Cylinder" and stops before
        "16.0 Solar Water Heating".
      * Passes it to self.two_columns_processor with the sub-titles
        Volume, Insulation Type, Insulation Thickness and Thermostat,
        an avoid list holding both headings, and the number 15.1.
      * The local name "sub_tites" is a misspelling of "sub_titles".
        It is used consistently inside the method, so it is harmless.

    get_section_16
      * Takes the part of self.raw_data that starts at
        "16.0 Solar Water Heating" and stops before
        "17.0 Waste Water Heat Recovery System".
      * Passes it to self.two_columns_processor with the single sub-title
        "Solar Water Heating Details Known?", an avoid list holding both
        headings, and the number 16.0.

    Things to confirm
      * The type of self.raw_data is not visible in this patch. Both
        list.index and str.index raise ValueError when the heading is
        missing, and nothing here catches it -- TODO confirm every
        input contains the 15.1, 16.0 and 17.0 headings.
      * The comment lines at the end of hunk 2 are context lines. Their
        typos ("wiht", "pydantnic") must stay as they are, otherwise the
        patch no longer matches the target file.
      * Line breaks and indentation were reconstructed from a copy that
        had been collapsed onto one line. 4-space indentation is assumed
        and the trailing comment lines are assumed to start at column 0
        -- TODO verify against etl/pdfReader/sitenotes.py.

 etl/pdfReader/sitenotes.py | 27 +++++++++++++++++++++++++++
 1 file changed, 27 insertions(+)

diff --git a/etl/pdfReader/sitenotes.py b/etl/pdfReader/sitenotes.py
index 1120bbe..86c25b0 100644
--- a/etl/pdfReader/sitenotes.py
+++ b/etl/pdfReader/sitenotes.py
@@ -40,6 +40,8 @@ class QuidosSiteNotes(SiteNotesExtractor):
         self.get_section_14_1()
         self.get_section_14_2()
         self.get_section_15_0()
+        self.get_section_15_1()
+        self.get_section_16()
 
     def get_summary_information(self):
         # Summary Information
@@ -461,6 +463,31 @@ class QuidosSiteNotes(SiteNotesExtractor):
         ]
         self.two_columns_processor(data, sub_titles, avoid, 15.0)
 
+    def get_section_15_1(self):
+        data = self.raw_data[self.raw_data.index("15.1 Hot Water Cylinder"):self.raw_data.index("16.0 Solar Water Heating")]
+        sub_tites = [
+            "Volume",
+            "Insulation Type",
+            "Insulation Thickness",
+            "Thermostat",
+        ]
+        avoid = [
+            "16.0 Solar Water Heating",
+            "15.1 Hot Water Cylinder"
+        ]
+        self.two_columns_processor(data, sub_tites, avoid, 15.1)
+
+    def get_section_16(self):
+        data = self.raw_data[self.raw_data.index("16.0 Solar Water Heating"):self.raw_data.index("17.0 Waste Water Heat Recovery System")]
+        avoid = [
+            "16.0 Solar Water Heating",
+            "17.0 Waste Water Heat Recovery System",
+        ]
+        sub_titles = [
+            "Solar Water Heating Details Known?"
+        ]
+
+        self.two_columns_processor(data, sub_titles, avoid, 16.0)
 # Extract
 # Transform ( wiht validation pydantnic)
 # Load
\ No newline at end of file