from pprint import pprint

import numpy as np
import pandas as pd
from tqdm import tqdm

from epc_api.client import EpcClient
from epc_data.attributes.WindowAttributes import WindowAttributes
from epc_data.config import EPC_AUTH_TOKEN
from epc_data.downloader import pagenated_epc_download
from epc_data.EpcClean import EpcClean
from epc_data.Property import Property
from epc_data.temp_inputs import input_data

# Row of the sorted window-description table that is pretty-printed for
# manual inspection at the end of handler().
_INSPECT_ROW = 88


def _is_empty_value(value):
    """Return True when *value* is None, NaN, or equal to False.

    NaN needs its own check: ``value in [np.nan]`` only matches the ``np.nan``
    object itself (NaN never compares equal), so NaN floats boxed from a
    numeric DataFrame column would otherwise be kept.

    Note that ``0`` compares equal to ``False`` and is therefore treated as
    empty too, exactly as the previous list-membership filter did.
    """
    if isinstance(value, (float, np.floating)) and np.isnan(value):
        return True
    return value in (None, False)


def _window_attributes_frame(data):
    """Build a table of parsed attributes for every distinct window description.

    Args:
        data: iterable of EPC records; each must have a "windows-description" key.

    Returns:
        A DataFrame with one row per distinct description, holding the
        description under "original_description" plus whatever keys
        ``WindowAttributes(description).process()`` returns, sorted by
        description with a fresh 0..n-1 index.
    """
    descriptions = {record["windows-description"] for record in data}
    rows = [
        {"original_description": description, **WindowAttributes(description).process()}
        for description in descriptions
    ]
    if not rows:
        # Sorting a column-less frame would raise KeyError; return an empty
        # table that still has the column callers filter on.
        return pd.DataFrame(columns=["original_description"])

    frame = pd.DataFrame(rows)
    return frame.sort_values("original_description").reset_index(drop=True)


def handler():
    """Download EPC data for the input properties' local authorities and inspect it.

    Steps:
      1. Build a Property for every entry in ``input_data`` and call
         ``search_address_epc()`` on it (presumably this populates ``p.data``
         -- confirm against Property).
      2. Collect the distinct "local-authority" values and download up to
         10 pages of 5000 records for each.
      3. Run ``EpcClean`` over the downloaded records.
      4. For testing: parse every distinct window description and
         pretty-print the non-empty attributes of row ``_INSPECT_ROW``.

    Returns:
        None.
    """
    # To begin with, the input data is a list of dictionaries, however we would read this file in
    epc_client = EpcClient(auth_token=EPC_AUTH_TOKEN)

    input_properties = [
        Property(postcode=config['postcode'], address1=config['address1'], epc_client=epc_client)
        for config in input_data
    ]

    for p in input_properties:
        p.search_address_epc()

    local_authorities = {p.data['local-authority'] for p in input_properties}

    data = []
    for la in tqdm(local_authorities):
        data.extend(
            pagenated_epc_download(
                client=epc_client,
                params={"local-authority": la},
                page_size=5000,
                n_pages=10,
            )
        )

    # The return value of clean() is not used here.
    # NOTE(review): presumably it cleans `data` in place -- confirm against EpcClean.
    cleaner = EpcClean(data)
    cleaner.clean()

    # For testing:
    df = _window_attributes_frame(data)

    # Boolean-mask selection keeps each column's own dtype in the record and
    # yields an empty list (instead of raising) when the row does not exist.
    matches = df[df.index == _INSPECT_ROW].to_dict("records")
    if matches:
        record = {k: v for k, v in matches[0].items() if not _is_empty_value(v)}
        pprint(record)

    # Open questions noted while inspecting heating descriptions:
    # - 'Boiler and radiators, mains gas, Electric storage heaters'
    #   This has has_electric as true and not sure if we want that
    # - 'Boiler and radiators, mains gas, Electric underfloor heating'
    #   This has has_electric as true and has has_underfloor_heating as true and
    #   has_electric_underfloor_heating as true
    #   and not sure if we want that but might be fine
    # - 'Air source heat pump, radiators and underfloor, electric'
    # - LPG boiler