mirror of
https://github.com/Hestia-Homes/Model.git
synced 2026-06-08 11:17:27 +00:00
Merge pull request #495 from Hestia-Homes/funding-engine
Funding engine - fixed multiple bugs, working on an offline testing framework
This commit is contained in:
commit
f6f8c3305d
20 changed files with 708 additions and 113 deletions
|
|
@ -1,54 +1,14 @@
|
|||
from etl.epc.settings import DATA_ANOMALY_MATCHES as data_anon_matches
|
||||
from etl.epc.settings import DATA_ANOMALY_MATCHES as data_anon_matches
|
||||
|
||||
|
||||
class Definitions:
|
||||
"""
|
||||
This class contains some base attributes which are used across multiple other classes
|
||||
"""
|
||||
|
||||
# Anomalies described here: https://epc.opendatacommunities.org/docs/guidance#glossary
|
||||
DATA_ANOMALY_MATCHES = {
|
||||
# Invalid reports are where the value provided is out of bounds, e.g. a negative energy rating of -1199 or a
|
||||
# non-integer, there is no valid energy band for this, so it is marked as INVALID!
|
||||
"INVALID",
|
||||
"INVALID!",
|
||||
# When the energy certificate was first lodged on the register there was no requirement to lodge this data
|
||||
# item, i.e. a non-mandatory item.
|
||||
"NO DATA!",
|
||||
"NODATA!",
|
||||
# When the energy certificate was first lodged on the register there was no requirement to lodge this data item,
|
||||
# i.e.a non - mandatory item.
|
||||
"N/A",
|
||||
# A value generated by the register to account for a data item that was not mandatory when the lodgement of
|
||||
# the energy certificate occurred. When the data item became mandatory the register operator, for backwards
|
||||
# compatibility purposes, populated the data field with a value of ‘not recorded’ to ensure that the energy
|
||||
# certificate retrieval process is successfully completed. Mandatory data items cannot be applied
|
||||
# retrospectively to energy certificates lodged before the date of the change.
|
||||
"Not recorded",
|
||||
# The data also contains DECs with an operational rating of ‘9999’ (a ‘default’ DEC). The production of a
|
||||
# ‘default’ DEC value was allowed to enable building occupiers, with poor quality or no energy data,
|
||||
# the opportunity to comply with the regulations. From April 2011 the ability to lodge a ‘default’ DEC was no
|
||||
# longer allowed.
|
||||
"9999",
|
||||
# The Building Emission Rate (BER) data field for non-domestic buildings may contain a ‘blank’ value. The BER
|
||||
# was only lodged on the register from 7 March 2010.
|
||||
"Blank"
|
||||
# There are currently just over 8,600 records where the local authority identifier is ‘null’. This is due to
|
||||
# the Register Operator not being able to match the building address in the Markermap Ordinance Survey (GB)
|
||||
# lookup tables or OS MasterMap Address Layer 2 data. The majority of these addresses have been requested
|
||||
# manually by energy assessors for inclusion by the Register Operator in the registers (e.g. new builds,
|
||||
# etc). These records are being published for completeness. An ongoing process to manage these manually added
|
||||
# addresses will take time to develop to deal with these and future anomalies.
|
||||
#
|
||||
# There are several fields within the lodged data where it is possible to enter multiple entries to cater for
|
||||
# different data_types of build within a single property, i.e. extensions. This results in multiple entries for
|
||||
# the description fields for floor, roof and wall. For the purposes of this data release only the information
|
||||
# contained within the first of these multiple entries is being provided. As there are no restrictions on the
|
||||
# value in this first field it means that sometimes the first field in a multiple entry description field may
|
||||
# contain a ‘null’ value. A resolution to correct these anomalies will be considered for future data releases.
|
||||
"NULL",
|
||||
# We sometimes see fields populated with just an empty string.
|
||||
"",
|
||||
# An older value which rarely shows up but has been seen in the data.
|
||||
"UNKNOWN",
|
||||
}
|
||||
DATA_ANOMALY_MATCHES = data_anon_matches
|
||||
|
||||
DATA_ANOMALY_SUBSTRINGS = {
|
||||
# Where values in a ‘pick’ list that have been superseded by another value. For example, where a value for
|
||||
|
|
|
|||
|
|
@ -1376,10 +1376,16 @@ class AssetList:
|
|||
# 3) We don't remove anything that haas access issues yet
|
||||
|
||||
if self.non_intrusives_present:
|
||||
non_intrusives_wall_filter = (
|
||||
(self.standardised_asset_list['non-intrusives: Construction'] == "CAVITY") &
|
||||
self.standardised_asset_list['non-intrusives: Insulated'].isin(["EMPTY", "PARTIAL"])
|
||||
)
|
||||
if self.new_format_non_insturives_present_v2:
|
||||
non_intrusives_wall_filter = (
|
||||
(self.standardised_asset_list['non-intrusives: Construction'] == "CAVITY") &
|
||||
self.standardised_asset_list['non-intrusives: Insulated'].isin(["EMPTY", "PARTIAL", "EMPTY CAVITY"])
|
||||
)
|
||||
else:
|
||||
non_intrusives_wall_filter = (
|
||||
(self.standardised_asset_list['non-intrusives: Construction'] == "CAVITY") &
|
||||
self.standardised_asset_list['non-intrusives: Insulated'].isin(["EMPTY", "PARTIAL"])
|
||||
)
|
||||
elif self.old_format_non_intrusives_present:
|
||||
non_intrusives_wall_filter = (
|
||||
self.standardised_asset_list['non-intrusives: WFT Findings'].str.lower().str.strip().isin(
|
||||
|
|
|
|||
|
|
@ -59,25 +59,25 @@ def app():
|
|||
Property UPRN
|
||||
"""
|
||||
|
||||
# Colchester
|
||||
data_folder = "/Users/khalimconn-kowlessar/Documents/hestia/Customers/Colchester/Aug2025 202 inspections"
|
||||
data_filename = "Colchester Borough Homes - Inspections - Additional 202 Addresses JW 280725 copy.xlsx"
|
||||
sheet_name = "Extra 202 Colchester Addresses"
|
||||
postcode_column = 'domna_postcode'
|
||||
address1_column = "domna_address_1"
|
||||
# Lambeth
|
||||
data_folder = "/Users/khalimconn-kowlessar/Documents/hestia/Customers/Lambeth"
|
||||
data_filename = "LAMBETH Asset List ( Incomplete).xlsx"
|
||||
sheet_name = "Green properties"
|
||||
postcode_column = 'SX3 Postcode'
|
||||
address1_column = "SX3 Short Address"
|
||||
address1_method = None
|
||||
fulladdress_column = "domna_full_address"
|
||||
address_cols_to_concat = []
|
||||
fulladdress_column = None
|
||||
address_cols_to_concat = ["SX3 Short Address"]
|
||||
missing_postcodes_method = None
|
||||
landlord_year_built = None
|
||||
landlord_os_uprn = None
|
||||
landlord_property_type = "landlord_property_type"
|
||||
landlord_built_form = "landlord_built_form"
|
||||
landlord_property_type = "Property Type"
|
||||
landlord_built_form = None
|
||||
landlord_wall_construction = None
|
||||
landlord_roof_construction = None
|
||||
landlord_heating_system = None
|
||||
landlord_existing_pv = None
|
||||
landlord_property_id = "landlord_property_id"
|
||||
landlord_property_id = "row_id"
|
||||
landlord_sap = None
|
||||
outcomes_filename = None
|
||||
outcomes_sheetname = None
|
||||
|
|
@ -91,7 +91,41 @@ def app():
|
|||
phase = False
|
||||
ecosurv_landlords = None
|
||||
asset_list_header = 0
|
||||
landlord_block_reference = "landlord_block_reference"
|
||||
landlord_block_reference = None
|
||||
|
||||
# # Colchester
|
||||
# data_folder = "/Users/khalimconn-kowlessar/Documents/hestia/Customers/Colchester/Aug2025 202 inspections"
|
||||
# data_filename = "Colchester Borough Homes - Inspections - Additional 202 Addresses JW 280725 copy.xlsx"
|
||||
# sheet_name = "Extra 202 Colchester Addresses"
|
||||
# postcode_column = 'domna_postcode'
|
||||
# address1_column = "domna_address_1"
|
||||
# address1_method = None
|
||||
# fulladdress_column = "domna_full_address"
|
||||
# address_cols_to_concat = []
|
||||
# missing_postcodes_method = None
|
||||
# landlord_year_built = None
|
||||
# landlord_os_uprn = None
|
||||
# landlord_property_type = "landlord_property_type"
|
||||
# landlord_built_form = "landlord_built_form"
|
||||
# landlord_wall_construction = None
|
||||
# landlord_roof_construction = None
|
||||
# landlord_heating_system = None
|
||||
# landlord_existing_pv = None
|
||||
# landlord_property_id = "landlord_property_id"
|
||||
# landlord_sap = None
|
||||
# outcomes_filename = None
|
||||
# outcomes_sheetname = None
|
||||
# outcomes_postcode = None
|
||||
# outcomes_houseno = None
|
||||
# outcomes_id = None
|
||||
# outcomes_address = None
|
||||
# master_filepaths = []
|
||||
# master_id_colnames = []
|
||||
# master_to_asset_list_filepath = None
|
||||
# phase = False
|
||||
# ecosurv_landlords = None
|
||||
# asset_list_header = 0
|
||||
# landlord_block_reference = "landlord_block_reference"
|
||||
|
||||
# # Abri
|
||||
# data_folder = "/Users/khalimconn-kowlessar/Documents/hestia/Customers/Abri/Post Inspections"
|
||||
|
|
@ -128,38 +162,38 @@ def app():
|
|||
# landlord_block_reference = None
|
||||
|
||||
# Freebridge
|
||||
# data_folder = "/Users/khalimconn-kowlessar/Documents/hestia/Customers/Freebridge"
|
||||
# data_filename = "Domna - FCH property data May 25 copy.xlsx"
|
||||
# sheet_name = "EPC Data"
|
||||
# postcode_column = 'Post Code'
|
||||
# address1_column = "Address 1"
|
||||
# address1_method = None
|
||||
# fulladdress_column = None
|
||||
# address_cols_to_concat = ["Address 1", "Address 4"]
|
||||
# missing_postcodes_method = None
|
||||
# landlord_year_built = "Build Date"
|
||||
# landlord_os_uprn = None
|
||||
# landlord_property_type = "Property Type"
|
||||
# landlord_built_form = None
|
||||
# landlord_wall_construction = "Walls Description"
|
||||
# landlord_heating_system = "Heating Type"
|
||||
# landlord_existing_pv = None
|
||||
# landlord_property_id = "Place Ref"
|
||||
# landlord_roof_construction = "Roof Description"
|
||||
# landlord_sap = "Current SAP"
|
||||
# outcomes_filename = []
|
||||
# outcomes_sheetname = []
|
||||
# outcomes_postcode = []
|
||||
# outcomes_houseno = []
|
||||
# outcomes_address = []
|
||||
# outcomes_id = []
|
||||
# master_filepaths = []
|
||||
# master_to_asset_list_filepath = None
|
||||
# asset_list_header = 0
|
||||
# landlord_block_reference = None
|
||||
# master_id_colnames = []
|
||||
# phase = True # Inspections not complete, produce a partial view
|
||||
# ecosurv_landlords = None
|
||||
data_folder = "/Users/khalimconn-kowlessar/Documents/hestia/Customers/Freebridge/Aug2025 programme"
|
||||
data_filename = "Domna - FCH property data May 25 copy.xlsx"
|
||||
sheet_name = "EPC Data"
|
||||
postcode_column = 'Post Code'
|
||||
address1_column = "Address 1"
|
||||
address1_method = None
|
||||
fulladdress_column = None
|
||||
address_cols_to_concat = ["Address 1", "Address 4"]
|
||||
missing_postcodes_method = None
|
||||
landlord_year_built = "Build Date"
|
||||
landlord_os_uprn = None
|
||||
landlord_property_type = "Property Type"
|
||||
landlord_built_form = None
|
||||
landlord_wall_construction = "Walls Description"
|
||||
landlord_heating_system = "Heating Type"
|
||||
landlord_existing_pv = None
|
||||
landlord_property_id = "Place Ref"
|
||||
landlord_roof_construction = "Roof Description"
|
||||
landlord_sap = "Current SAP"
|
||||
outcomes_filename = []
|
||||
outcomes_sheetname = []
|
||||
outcomes_postcode = []
|
||||
outcomes_houseno = []
|
||||
outcomes_address = []
|
||||
outcomes_id = []
|
||||
master_filepaths = []
|
||||
master_to_asset_list_filepath = None
|
||||
asset_list_header = 0
|
||||
landlord_block_reference = None
|
||||
master_id_colnames = []
|
||||
phase = False # Inspections not complete, produce a partial view
|
||||
ecosurv_landlords = None
|
||||
|
||||
# data_folder = "/Users/khalimconn-kowlessar/Documents/hestia/Customers/Broadlands"
|
||||
# data_filename = "Broadlands Asset List.xlsx"
|
||||
|
|
|
|||
|
|
@ -341,5 +341,7 @@ PROPERTY_MAPPING = {
|
|||
'house': 'house',
|
||||
'block of flats': 'block of flats',
|
||||
'bungalow': 'bungalow',
|
||||
'flat': 'flat'
|
||||
'flat': 'flat',
|
||||
'FLA': 'flat',
|
||||
'HOU': 'house'
|
||||
}
|
||||
|
|
|
|||
|
|
@ -358,11 +358,13 @@ class Funding:
|
|||
|
||||
# Format the starting U-value according to special rules
|
||||
if closest_starting == 0.45:
|
||||
starting_str = "2"
|
||||
starting_str = "0.45"
|
||||
elif closest_starting == 2.00:
|
||||
starting_str = "2.0"
|
||||
elif closest_starting == 1.70:
|
||||
starting_str = "1.7"
|
||||
elif closest_starting == 1:
|
||||
starting_str = "1.0"
|
||||
else:
|
||||
starting_str = f"{closest_starting:.2f}"
|
||||
|
||||
|
|
@ -618,7 +620,7 @@ class Funding:
|
|||
]
|
||||
|
||||
if solar_pps_df.empty and self.starting_sap_band in [
|
||||
"Low_C", "High_C", "Low_B", "High_B", "Low_B", "High_A"
|
||||
"Low_C", "High_C", "Low_B", "High_B", "Low_B", "High_A", "Low_A"
|
||||
]:
|
||||
# No funding for EPC C or above
|
||||
return 0
|
||||
|
|
@ -670,6 +672,9 @@ class Funding:
|
|||
return 0
|
||||
|
||||
if measure_type in ["double_glazing", "secondary_glazing"]:
|
||||
# No funding for EPC C or above
|
||||
if self.starting_sap_band in ["Low_C", "High_C", "Low_B", "High_B", "Low_A", "High_A"]:
|
||||
return 0
|
||||
# pps is under the WG_singletodouble Measure_Type
|
||||
pps = filtered_pps_matrix[
|
||||
filtered_pps_matrix["Measure_Type"] == "WG_singletodouble"
|
||||
|
|
@ -716,12 +721,15 @@ class Funding:
|
|||
else:
|
||||
pps = filtered_pps_matrix[
|
||||
(filtered_pps_matrix["Pre_Main_Heating_Source"] == pre_heating_system) &
|
||||
(filtered_pps_matrix["Post_Main_Heating_Source"] == "Condensing Gas Boiler") &
|
||||
(filtered_pps_matrix["Measure_Type"] == "B_Upgrade_preHCs")
|
||||
(filtered_pps_matrix["Post_Main_Heating_Source"] == "Condensing Gas Boiler")
|
||||
# (filtered_pps_matrix["Measure_Type"] == "B_Upgrade_preHCs")
|
||||
]
|
||||
# Depending on different systems, e.g. room heaters, we take the best options
|
||||
if pps.shape[0] > 1:
|
||||
pps = pps[pps["Cost Savings"] == min(pps["Cost Savings"])].head(1)
|
||||
|
||||
# No funding for EPC C or above
|
||||
if self.starting_sap_band in ["Low_C", "High_C", "Low_B", "High_B", "Low_A", "High_A"] and pps.empty:
|
||||
if self.starting_sap_band in ["Low_C", "High_C", "Low_B", "High_B", "Low_A", "High_A"] or pps.empty:
|
||||
return 0
|
||||
|
||||
if pps.shape[0] != 1:
|
||||
|
|
|
|||
|
|
@ -624,7 +624,10 @@ class Property:
|
|||
if len(attributes) == 0:
|
||||
# We attempt to perform the clean on the fly
|
||||
cleaner_cls = all_cleaner_map[description]
|
||||
cleaner_cls = cleaner_cls(self.data[description])
|
||||
if description == "lighting-description":
|
||||
cleaner_cls = cleaner_cls(self.data[description], averages=None)
|
||||
else:
|
||||
cleaner_cls = cleaner_cls(self.data[description])
|
||||
processed = {
|
||||
"original_description": self.data[description],
|
||||
"clean_description": cleaner_cls.description.replace(
|
||||
|
|
@ -1165,7 +1168,8 @@ class Property:
|
|||
'heat pump': 'Electricity',
|
||||
'solid fuel boiler': 'Solid Fuel',
|
||||
'solid fuel range cooker': 'Solid Fuel',
|
||||
'room heaters': 'Varied' # Could be any fuel, further specifics needed based on context
|
||||
'room heaters': 'Varied', # Could be any fuel, further specifics needed based on context
|
||||
"single-point gas": "Natural Gas"
|
||||
}
|
||||
|
||||
# Define a mapping from system types to general categories or modifications of fuel types
|
||||
|
|
@ -1176,6 +1180,11 @@ class Property:
|
|||
'community scheme': 'Community Scheme'
|
||||
}
|
||||
|
||||
hotwater_appliance_to_fuel = {
|
||||
'gas range cooker': 'Natural Gas',
|
||||
'oil range cooker': 'Oil'
|
||||
}
|
||||
|
||||
self.heating_energy_source = list({
|
||||
fuel for key, fuel in heating_fuel_mapping.items() if self.main_heating.get(key, False)
|
||||
})
|
||||
|
|
@ -1202,8 +1211,13 @@ class Property:
|
|||
self.heating_energy_source = self.heating_energy_source[0]
|
||||
|
||||
if self.heating_energy_source == "Varied (Community Scheme)":
|
||||
if self.main_fuel["fuel_type"] in ["mains gas", None]: # We assume when None as it's unknown
|
||||
self.heating_energy_source = "Natural Gas (Community Scheme)"
|
||||
fuel_map = {
|
||||
None: "Natural Gas (Community Scheme)",
|
||||
"mains gas": "Natural Gas (Community Scheme)",
|
||||
"biomass": "Smokeless Fuel",
|
||||
}
|
||||
if self.main_fuel["fuel_type"] in fuel_map: # We assume when None as it's unknown
|
||||
self.heating_energy_source = fuel_map[self.main_fuel["fuel_type"]]
|
||||
else:
|
||||
raise Exception("Implement me")
|
||||
|
||||
|
|
@ -1213,8 +1227,7 @@ class Property:
|
|||
if self.hotwater["extra_features"] == "plus solar":
|
||||
self.hot_water_energy_source = self.heating_energy_source + " + Solar Thermal"
|
||||
return
|
||||
|
||||
else:
|
||||
elif self.hotwater["system_type"] is not None:
|
||||
fuel = system_type_modification[self.hotwater["system_type"]]
|
||||
|
||||
if self.hotwater["extra_features"] == "plus solar":
|
||||
|
|
@ -1229,6 +1242,8 @@ class Property:
|
|||
self.hot_water_energy_source = assumptions.DESCRIPTIONS_TO_FUEL_TYPES[secondary_heating]["fuel"]
|
||||
else:
|
||||
raise Exception("Investiage me")
|
||||
else:
|
||||
self.hot_water_energy_source = hotwater_appliance_to_fuel[self.hotwater["appliance"]]
|
||||
|
||||
def is_ashp_valid(self, measures):
|
||||
|
||||
|
|
|
|||
|
|
@ -73,6 +73,11 @@ DESCRIPTIONS_TO_FUEL_TYPES = {
|
|||
"Electric storage heaters, Room heaters, electric": {"fuel": "Electricity", "cop": 1},
|
||||
'Boiler and underfloor heating, oil': {"fuel": "Oil", "cop": 0.85},
|
||||
"Boiler and radiators, smokeless fuel": {"fuel": "Smokeless Fuel", "cop": 0.85},
|
||||
"Boiler and radiators, mains gas, Boiler and underfloor heating, mains gas": {"fuel": "Natural Gas", "cop": 0.85},
|
||||
"Electric ceiling heating, electric": {"fuel": "Electricity", "cop": 1},
|
||||
"Air source heat pump, warm air, electric": {
|
||||
"fuel": "Electricity", "cop": AVERAGE_ASHP_EFFICIENCY / 100
|
||||
}
|
||||
}
|
||||
|
||||
# These are the measure types where if there is a ventilation recommendation, we force the inclusion of it
|
||||
|
|
|
|||
531
backend/tests/test_integration.py
Normal file
531
backend/tests/test_integration.py
Normal file
|
|
@ -0,0 +1,531 @@
|
|||
import ast
|
||||
import json
|
||||
from copy import deepcopy
|
||||
from dataclasses import replace
|
||||
from datetime import datetime
|
||||
|
||||
import random
|
||||
from tqdm import tqdm
|
||||
import pandas as pd
|
||||
import numpy as np
|
||||
from etl.epc.Record import EPCRecord
|
||||
from backend.SearchEpc import SearchEpc
|
||||
from sqlalchemy.exc import IntegrityError, OperationalError
|
||||
from sqlalchemy.orm import sessionmaker
|
||||
from starlette.responses import Response
|
||||
|
||||
from backend.app.config import get_settings, get_prediction_buckets
|
||||
from backend.app.db.connection import db_engine
|
||||
from backend.app.db.functions.materials_functions import get_materials
|
||||
from backend.app.db.functions.portfolio_functions import aggregate_portfolio_recommendations
|
||||
from backend.app.db.functions.property_functions import (
|
||||
create_property, create_property_details_epc, create_property_targets, update_property_data,
|
||||
update_or_create_property_spatial_details
|
||||
)
|
||||
from backend.app.db.functions.recommendations_functions import (
|
||||
create_plan, upload_recommendations, create_scenario
|
||||
)
|
||||
from backend.app.db.functions.funding_functions import upload_funding
|
||||
from backend.app.db.functions.energy_assessment_functions import get_latest_assessment_by_uprn
|
||||
from backend.app.db.models.portfolio import rating_lookup
|
||||
from backend.app.plan.schemas import PlanTriggerRequest, WALL_INSULATION_MEASURES, ROOF_INSULATION_MEASURES
|
||||
from backend.app.plan.utils import get_cleaned
|
||||
from backend.app.utils import sap_to_epc
|
||||
import backend.app.assumptions as assumptions
|
||||
|
||||
from backend.ml_models.api import ModelApi
|
||||
from backend.Property import Property
|
||||
from backend.apis.GoogleSolarApi import GoogleSolarApi
|
||||
|
||||
from recommendations.optimiser.CostOptimiser import CostOptimiser
|
||||
from recommendations.optimiser.GainOptimiser import GainOptimiser
|
||||
import recommendations.optimiser.optimiser_functions as optimiser_functions
|
||||
from recommendations.Recommendations import Recommendations
|
||||
from utils.logger import setup_logger
|
||||
from utils.s3 import read_dataframe_from_s3_parquet, read_csv_from_s3, read_excel_from_s3
|
||||
from backend.ml_models.Valuation import PropertyValuation
|
||||
|
||||
from etl.bill_savings.KwhData import KwhData
|
||||
from etl.spatial.OpenUprnClient import OpenUprnClient
|
||||
from etl.find_my_epc.RetrieveFindMyEpc import RetrieveFindMyEpc
|
||||
|
||||
from backend.Funding import Funding
|
||||
from recommendations.optimiser.funding_optimiser import optimise_with_funding_paths
|
||||
from recommendations.recommendation_utils import convert_thickness_to_numeric, get_wall_u_value
|
||||
|
||||
# Input data (temp)
|
||||
import pickle
|
||||
|
||||
import pandas as pd
|
||||
|
||||
with open("local_data_for_deletion.pkl", 'rb') as f:
|
||||
local_data = pickle.load(f)
|
||||
|
||||
cleaning_data = local_data["cleaning_data"]
|
||||
materials = local_data["materials"]
|
||||
cleaned = local_data["cleaned"]
|
||||
project_scores_matrix = local_data["project_scores_matrix"]
|
||||
partial_project_scores_matrix = local_data["partial_project_scores_matrix"]
|
||||
whlg_eligible_postcodes = local_data["whlg_eligible_postcodes"]
|
||||
|
||||
with open("kwh_client_for_deletion.pkl", "rb") as f:
|
||||
kwh_client = pickle.load(f)
|
||||
|
||||
epc_data = pd.read_csv(
|
||||
"/Users/khalimconn-kowlessar/Downloads/all-domestic-certificates/domestic-E06000002-Middlesbrough/certificates.csv",
|
||||
low_memory=False
|
||||
)
|
||||
|
||||
# TODO: Store this for cleaning
|
||||
costs_by_floor_area = epc_data[
|
||||
pd.to_datetime(epc_data["LODGEMENT_DATE"]) >= "2024-01-01"
|
||||
][["TOTAL_FLOOR_AREA", "CURRENT_ENERGY_EFFICIENCY", "LIGHTING_COST_CURRENT", "HEATING_COST_CURRENT",
|
||||
"HOT_WATER_COST_CURRENT"]].copy()
|
||||
|
||||
costs_by_floor_area.columns = [c.lower().replace("_", "-") for c in costs_by_floor_area.columns]
|
||||
for c in ["lighting-cost-current", "heating-cost-current", "hot-water-cost-current"]:
|
||||
costs_by_floor_area[c + "_scaled"] = costs_by_floor_area[c] / costs_by_floor_area["total-floor-area"]
|
||||
|
||||
costs_by_floor_area = costs_by_floor_area.groupby("current-energy-efficiency")[
|
||||
["lighting-cost-current_scaled", "heating-cost-current_scaled", "hot-water-cost-current_scaled"]
|
||||
].mean().reset_index()
|
||||
|
||||
sample_epc_data = epc_data[pd.to_datetime(epc_data["LODGEMENT_DATE"]) >= "2015-01-01"].drop_duplicates("UPRN").sample(
|
||||
1000).reset_index(drop=True)
|
||||
|
||||
# TODO: In Property find_energy_sources, sort out biomass community heating - what fuel type
|
||||
# TODO: We might be able to remove find_energy_sources entirely and remove estimate_electrical_consumption. It's used
|
||||
# in the google solar api but is it really needed? I don't think it's super accurate. It might be better to
|
||||
# just use an average energy consumption by floor area for UK households?
|
||||
# Load the input properties
|
||||
input_properties = []
|
||||
for row_id, config in tqdm(sample_epc_data.iterrows(), total=len(sample_epc_data)):
|
||||
epc = {
|
||||
k.lower().replace("_", "-"): v if not pd.isnull(v) else None for k, v in config.items()
|
||||
}
|
||||
# Avoid the data load inside of EPCRecord - something we should pull out
|
||||
for x in ["number-habitable-rooms", "floor-height", "number-heated-rooms"]:
|
||||
if pd.isnull(epc[x]):
|
||||
if x == "floor-height":
|
||||
epc[x] = 2.4
|
||||
if x == "number-habitable-rooms":
|
||||
epc[x] = 3
|
||||
if x == "number-heated-rooms":
|
||||
epc[x] = 3
|
||||
|
||||
epc_records = {'original_epc': epc, 'full_sap_epc': {}, 'old_data': []}
|
||||
|
||||
prepared_epc = EPCRecord(
|
||||
epc_records=epc_records,
|
||||
run_mode="newdata",
|
||||
cleaning_data=cleaning_data,
|
||||
)
|
||||
|
||||
input_properties.append(
|
||||
Property(
|
||||
id=row_id,
|
||||
is_new=True,
|
||||
address=epc["address"],
|
||||
postcode=epc["postcode"],
|
||||
epc_record=prepared_epc,
|
||||
already_installed={},
|
||||
property_valuation={},
|
||||
non_invasive_recommendations=[],
|
||||
energy_assessment=None,
|
||||
**Property.extract_kwargs(config), # TODO: Depraecate this
|
||||
)
|
||||
)
|
||||
|
||||
# For each property, insert the default solar configuration
|
||||
for p in tqdm(input_properties):
|
||||
solar_api = GoogleSolarApi(
|
||||
api_key=None, solar_materials=[m for m in materials if m["type"] == "solar_pv"], max_retries=5
|
||||
)
|
||||
panel_performance = solar_api.default_panel_performance(property_instance=p)
|
||||
p.set_solar_panel_configuration(
|
||||
solar_panel_configuration={
|
||||
"insights_data": None, "panel_performance": panel_performance, "unit_share_of_energy": 1
|
||||
},
|
||||
)
|
||||
|
||||
# We mock kwh preds
|
||||
mocked_kwh_predictions = {"heating_kwh_predictions": [], "hotwater_kwh_predictions": []}
|
||||
for p in tqdm(input_properties):
|
||||
mocked_kwh_predictions["heating_kwh_predictions"].append({
|
||||
"id": p.uprn, "predictions": random.sample(range(100, 3000), 1)[0]
|
||||
})
|
||||
mocked_kwh_predictions["hotwater_kwh_predictions"].append({
|
||||
"id": p.uprn, "predictions": random.sample(range(100, 3000), 1)[0]
|
||||
})
|
||||
mocked_kwh_predictions["heating_kwh_predictions"] = pd.DataFrame(mocked_kwh_predictions["heating_kwh_predictions"])
|
||||
mocked_kwh_predictions["hotwater_kwh_predictions"] = pd.DataFrame(mocked_kwh_predictions["hotwater_kwh_predictions"])
|
||||
|
||||
# TODO: We might want to implement this generally, via an ETL process
|
||||
for p in input_properties:
|
||||
for col in ["lighting-cost-current", "heating-cost-current", "hot-water-cost-current"]:
|
||||
if pd.isnull(p.data[col]):
|
||||
min_diff = abs(
|
||||
(costs_by_floor_area["current-energy-efficiency"] - p.data["current-energy-efficiency"])
|
||||
).min()
|
||||
df = costs_by_floor_area[
|
||||
abs((costs_by_floor_area["current-energy-efficiency"] - p.data[
|
||||
"current-energy-efficiency"])) == min_diff
|
||||
]
|
||||
if df.shape[0] > 1:
|
||||
df = df.head(1)
|
||||
p.data[col] = (df[col + "_scaled"] * p.data["total-floor-area"]).values[0]
|
||||
|
||||
[
|
||||
p.set_features(cleaned=cleaned, kwh_client=kwh_client, kwh_predictions=mocked_kwh_predictions) for p in
|
||||
input_properties
|
||||
]
|
||||
# for p in input_properties:
|
||||
# p.set_features(cleaned=cleaned, kwh_client=kwh_client, kwh_predictions=mocked_kwh_predictions)
|
||||
|
||||
# Run the recommendations
|
||||
recommendations = {}
|
||||
recommendations_scoring_data = []
|
||||
representative_recommendations = {}
|
||||
for p in tqdm(input_properties):
|
||||
if p.data["property-type"] == "House" and pd.isnull(p.data["built-form"]):
|
||||
p.data["built-form"] = "Semi-Detached"
|
||||
recommender = Recommendations(
|
||||
property_instance=p,
|
||||
materials=materials,
|
||||
exclusions=[],
|
||||
inclusions=[],
|
||||
default_u_values=True
|
||||
)
|
||||
property_recommendations, property_representative_recommendations = recommender.recommend()
|
||||
|
||||
if not property_recommendations:
|
||||
continue
|
||||
|
||||
recommendations[p.id] = property_recommendations
|
||||
representative_recommendations[p.id] = property_representative_recommendations
|
||||
|
||||
p.create_base_difference_epc_record(cleaned_lookup=cleaned)
|
||||
p.adjust_difference_record_with_recommendations(
|
||||
property_recommendations, property_representative_recommendations
|
||||
)
|
||||
|
||||
recommendations_scoring_data.extend(p.recommendations_scoring_data)
|
||||
|
||||
recommendations_scoring_data = pd.DataFrame(recommendations_scoring_data)
|
||||
recommendations_scoring_data = recommendations_scoring_data.drop(
|
||||
columns=[
|
||||
"rdsap_change", "heat_demand_change", "carbon_change", "sap_ending", "heat_demand_ending",
|
||||
"carbon_ending"
|
||||
]
|
||||
)
|
||||
|
||||
model_predictions_mocked = {
|
||||
"sap_change_predictions": None,
|
||||
"heat_demand_predictions": None,
|
||||
"carbon_change_predictions": None,
|
||||
"heating_kwh_predictions": None,
|
||||
"hotwater_kwh_predictions": None,
|
||||
}
|
||||
|
||||
for k in model_predictions_mocked.keys():
|
||||
model_predictions_mocked[k] = recommendations_scoring_data[["id"]].copy()
|
||||
model_predictions_mocked[k][['property_id', 'recommendation_id']] = (
|
||||
model_predictions_mocked[k]['id'].str.split('+', expand=True)
|
||||
)
|
||||
model_predictions_mocked[k]['phase'] = model_predictions_mocked[k]['recommendation_id'].apply(
|
||||
ModelApi.extract_phase)
|
||||
|
||||
if k in ["heating_kwh_predictions", "hotwater_kwh_predictions"]:
|
||||
model_predictions_mocked[k]["predictions"] = random.choices(range(100, 3000),
|
||||
k=len(recommendations_scoring_data))
|
||||
continue
|
||||
|
||||
model_predictions_mocked[k] = model_predictions_mocked[k].sort_values(["property_id", "phase"], ascending=True)
|
||||
preds = []
|
||||
for p_id in model_predictions_mocked[k]["property_id"].unique():
|
||||
# We add some amount each time
|
||||
p = [p for p in input_properties if str(p.id) == p_id][0]
|
||||
if k == "sap_change_predictions":
|
||||
start = p.data["current-energy-efficiency"]
|
||||
elif k == "heat_demand_predictions":
|
||||
start = p.data["energy-consumption-current"]
|
||||
else:
|
||||
start = p.data["co2-emissions-current"]
|
||||
df = model_predictions_mocked[k][model_predictions_mocked[k]["property_id"] == p_id].copy()
|
||||
# Add some amount each time
|
||||
to_add = random.choices(range(0, 15), k=len(df))
|
||||
to_add = np.cumsum(to_add)
|
||||
df["predictions"] = start + to_add
|
||||
preds.append(df)
|
||||
preds = pd.concat(preds)
|
||||
model_predictions_mocked[k] = preds
|
||||
|
||||
for property_id in tqdm(recommendations.keys(), total=len(recommendations)):
|
||||
property_instance = [p for p in input_properties if p.id == property_id][0]
|
||||
|
||||
recommendations_with_impact, impact_summary = (
|
||||
Recommendations.calculate_recommendation_impact(
|
||||
property_instance=property_instance,
|
||||
all_predictions=model_predictions_mocked,
|
||||
recommendations=recommendations,
|
||||
representative_recommendations=representative_recommendations
|
||||
)
|
||||
)
|
||||
|
||||
# We use the impact_summary to update the simulation_epcs with the new SAP, heat demand, carbon, cost etc
|
||||
# at each phase
|
||||
property_instance.update_simulation_epcs(impact_summary)
|
||||
recommendations[property_id] = recommendations_with_impact
|
||||
|
||||
for property_id in tqdm([p.id for p in input_properties]):
|
||||
property_recommendations = recommendations.get(property_id, [])
|
||||
property_instance = [p for p in input_properties if p.id == property_id][0]
|
||||
|
||||
property_current_energy_bill = (
|
||||
Recommendations.calculate_recommendation_tenant_savings(
|
||||
property_instance=property_instance,
|
||||
kwh_simulation_predictions=model_predictions_mocked,
|
||||
property_recommendations=property_recommendations,
|
||||
ashp_cop=2.8
|
||||
)
|
||||
)
|
||||
property_instance.current_energy_bill = property_current_energy_bill
|
||||
|
||||
body = PlanTriggerRequest(
|
||||
**{'budget': None, 'goal': 'Increasing EPC', 'housing_type': 'Social', 'goal_value': 'B', 'portfolio_id': 0,
|
||||
'trigger_file_path': '', 'already_installed_file_path': '',
|
||||
'patches_file_path': None, 'non_invasive_recommendations_file_path': None,
|
||||
'valuation_file_path': '',
|
||||
'required_measures': [], 'scenario_name': 'EPC B', 'scenario_id': None,
|
||||
'multi_plan': True, 'optimise': True, 'default_u_values': True, 'ashp_cop': 2.8,
|
||||
'event_type': 'remote_assessment', 'simulate_sap_10': False, 'file_type': None, 'file_format': None,
|
||||
'sheet_name': None, 'sheet_count': None, 'index_start': None, 'index_end': None}
|
||||
)
|
||||
|
||||
for p in tqdm(input_properties):
|
||||
if not recommendations.get(p.id):
|
||||
continue
|
||||
|
||||
# we need to double unlist because we have a list of lists
|
||||
property_measure_types = {rec["type"] for recs in recommendations[p.id] for rec in recs}
|
||||
property_required_measures = [m for m in recommendations[p.id] if m[0]["type"] in body.required_measures]
|
||||
measures_to_optimise = [m for m in recommendations[p.id] if m[0]["type"] not in body.required_measures]
|
||||
|
||||
# If a measure requiring ventilation is selected, and the property does not have ventilation, we enfore
|
||||
# its inclusion
|
||||
needs_ventilation = any(
|
||||
x in property_measure_types for x in assumptions.measures_needing_ventilation
|
||||
) and not p.has_ventilation
|
||||
|
||||
if not measures_to_optimise:
|
||||
# Nothing to do, we just reshape the recommendations
|
||||
recommendations[p.id] = optimiser_functions.flatten_recommendations_with_defaults(
|
||||
p.id, recommendations, set()
|
||||
)
|
||||
continue
|
||||
|
||||
fixed_gain = optimiser_functions.calculate_fixed_gain(
|
||||
property_required_measures, recommendations, p, needs_ventilation
|
||||
)
|
||||
gain = optimiser_functions.calculate_gain(body=body, p=p, fixed_gain=fixed_gain)
|
||||
|
||||
funding = Funding(
|
||||
tenure="Social",
|
||||
project_scores_matrix=project_scores_matrix,
|
||||
partial_project_scores_matrix=partial_project_scores_matrix,
|
||||
whlg_eligible_postcodes=whlg_eligible_postcodes,
|
||||
eco4_social_cavity_abs_rate=12.5,
|
||||
eco4_social_solid_abs_rate=17,
|
||||
eco4_private_cavity_abs_rate=12.5,
|
||||
eco4_private_solid_abs_rate=17,
|
||||
gbis_social_cavity_abs_rate=21,
|
||||
gbis_social_solid_abs_rate=25,
|
||||
gbis_private_cavity_abs_rate=21,
|
||||
gbis_private_solid_abs_rate=28,
|
||||
)
|
||||
|
||||
li_thickness = convert_thickness_to_numeric(
|
||||
p.roof["insulation_thickness"], p.roof["is_pitched"], p.roof["is_flat"]
|
||||
)
|
||||
current_wall_u_value = p.walls["thermal_transmittance"]
|
||||
if current_wall_u_value is None:
|
||||
current_wall_u_value = get_wall_u_value(
|
||||
clean_description=p.walls["clean_description"],
|
||||
age_band=p.age_band,
|
||||
is_granite_or_whinstone=p.walls["is_granite_or_whinstone"],
|
||||
is_sandstone_or_limestone=p.walls["is_sandstone_or_limestone"],
|
||||
)
|
||||
|
||||
# We insert the innovation uplift
|
||||
measures_to_optimise_with_uplift = deepcopy(measures_to_optimise)
|
||||
|
||||
# TODO: Turn this into a function and store the innovaiton uplift
|
||||
for group in measures_to_optimise_with_uplift:
|
||||
for r in group:
|
||||
|
||||
if r["type"] in ["mechanical_ventilation", "low_energy_lighting", "secondary_heating",
|
||||
"extension_cavity_wall_insulation", "draught_proofing", "sealing_open_fireplace"]:
|
||||
(
|
||||
r["partial_project_score"],
|
||||
r["partial_project_funding"],
|
||||
r["innovation_uplift"],
|
||||
r["uplift_project_score"],
|
||||
) = (
|
||||
0, 0, 0, 0
|
||||
)
|
||||
continue
|
||||
|
||||
(
|
||||
r["partial_project_score"], r["partial_project_funding"], r["innovation_uplift"],
|
||||
r["uplift_project_score"]
|
||||
) = funding.get_innovation_uplift(
|
||||
measure=r,
|
||||
starting_sap=p.data["current-energy-efficiency"],
|
||||
floor_area=p.floor_area,
|
||||
is_cavity=p.walls["is_cavity_wall"],
|
||||
current_wall_uvalue=current_wall_u_value,
|
||||
is_partial="partial" in p.walls["clean_description"].lower(),
|
||||
existing_li_thickness=li_thickness,
|
||||
mainheating=p.main_heating,
|
||||
main_fuel=p.main_fuel,
|
||||
mainheat_energy_eff=p.data["mainheat-energy-eff"],
|
||||
)
|
||||
|
||||
input_measures = optimiser_functions.prepare_input_measures(
|
||||
measures_to_optimise_with_uplift, body.goal, needs_ventilation, funding=True
|
||||
)
|
||||
|
||||
# When the goal is Increasing EPC, we can run the funding optimiser
|
||||
if body.goal == "Increasing EPC":
|
||||
|
||||
solutions = optimise_with_funding_paths(
|
||||
p=p,
|
||||
input_measures=input_measures,
|
||||
housing_type=body.housing_type,
|
||||
budget=body.budget,
|
||||
target_gain=gain,
|
||||
funding=funding
|
||||
)
|
||||
|
||||
# Given the solutions we select the optimal one
|
||||
solutions["cost_less_full_project_funding"] = np.where(
|
||||
solutions["scheme"] == "eco4",
|
||||
solutions["total_cost"] - solutions["full_project_funding"] - solutions["total_uplift"],
|
||||
solutions["total_cost"] - solutions["partial_project_funding"] - solutions["total_uplift"]
|
||||
)
|
||||
|
||||
solutions["cost_less_full_project_funding"] = (
|
||||
solutions["total_cost"] - solutions["full_project_funding"] - solutions["total_uplift"]
|
||||
)
|
||||
solutions = solutions.sort_values("cost_less_full_project_funding", ascending=True)
|
||||
|
||||
if solutions["meets_upgrade_target"].any():
|
||||
# If we have a solution that meets the upgrade target, we select that one
|
||||
optimal_solution = solutions[solutions["meets_upgrade_target"]].iloc[0]
|
||||
else:
|
||||
# Pick the cheapest
|
||||
optimal_solution = solutions.iloc[0]
|
||||
|
||||
# This is the list of measures that we will recommend
|
||||
scheme = optimal_solution["scheme"]
|
||||
funded_measures = optimal_solution["items"] if scheme != "none" else []
|
||||
solution = optimal_solution["items"] + optimal_solution["unfunded_items"]
|
||||
# This is the total amount of funding that the project will produce (including uplifts) (£)
|
||||
project_funding = optimal_solution["full_project_funding"] if scheme == "eco4" else \
|
||||
optimal_solution["partial_project_funding"]
|
||||
# This is the total amount of funding associated to the uplift (£)
|
||||
total_uplift = optimal_solution["total_uplift"]
|
||||
# This is the funding scheme selected
|
||||
# This is the full project ABS
|
||||
full_project_score = optimal_solution["project_score"]
|
||||
# This is the partial project ABS
|
||||
partial_project_score = optimal_solution["partial_project_score"]
|
||||
# This is the uplift score ABS
|
||||
uplift_project_score = optimal_solution["total_uplift_score"]
|
||||
else:
|
||||
# We optimise and then we determine eligibility for funding, based on the measures selected
|
||||
optimiser = (
|
||||
GainOptimiser(
|
||||
input_measures, max_cost=body.budget, max_gain=gain, allow_slack=False
|
||||
) if body.budget else CostOptimiser(input_measures, min_gain=gain)
|
||||
)
|
||||
optimiser.setup()
|
||||
optimiser.solve()
|
||||
solution = optimiser.solution
|
||||
|
||||
recommendation_types = []
|
||||
for measures in input_measures:
|
||||
for measure in measures:
|
||||
recommendation_types.append(measure["type"])
|
||||
recommendation_types = set(recommendation_types)
|
||||
|
||||
has_wall_insulation_recommendation = any(
|
||||
(m in recommendation_types or "+".join([m, "mechanical_ventilation"])) for m in
|
||||
WALL_INSULATION_MEASURES
|
||||
)
|
||||
has_roof_insulation_recommendation = any(
|
||||
(m in recommendation_types or "+".join([m, "mechanical_ventilation"])) for m in
|
||||
ROOF_INSULATION_MEASURES
|
||||
)
|
||||
|
||||
funding.check_funding(
|
||||
measures=solution,
|
||||
starting_sap=p.data["current-energy-efficiency"],
|
||||
ending_sap=p.data["current-energy-efficiency"] + sum([x["gain"] for x in solution]),
|
||||
floor_area=p.floor_area,
|
||||
mainheat_description=p.main_heating["clean_description"],
|
||||
heating_control_description=p.main_heating_controls["clean_description"],
|
||||
is_cavity=p.walls["is_cavity_wall"],
|
||||
current_wall_uvalue=current_wall_u_value,
|
||||
is_partial="partial" in p.walls["clean_description"].lower(),
|
||||
existing_li_thickness=li_thickness,
|
||||
mainheating=p.main_heating,
|
||||
main_fuel=p.main_fuel,
|
||||
mainheat_energy_eff=p.data["mainheat-energy-eff"],
|
||||
has_wall_insulation_recommendation=has_wall_insulation_recommendation,
|
||||
has_roof_insulation_recommendation=has_roof_insulation_recommendation,
|
||||
)
|
||||
|
||||
# Determine the scheme
|
||||
scheme = "none"
|
||||
if funding.eco4_eligible:
|
||||
scheme = "eco4"
|
||||
if scheme == "none" and funding.gbis_eligible:
|
||||
scheme = "gbis"
|
||||
|
||||
funded_measures = solution if scheme in ["gbis", "eco4"] else []
|
||||
project_funding = 0 if funding.full_project_abs is not None else funding.full_project_abs
|
||||
total_uplift = funding.eco4_uplift
|
||||
full_project_score = 0 if funding.full_project_abs is not None else funding.full_project_abs
|
||||
partial_project_score = funding.partial_project_abs
|
||||
uplift_project_score = funding.eco4_uplift if scheme == "eco4" else funding.gbis_uplift
|
||||
|
||||
selected = {r["id"] for r in solution}
|
||||
|
||||
if property_required_measures:
|
||||
solution = optimiser_functions.add_required_measures(
|
||||
property_id=p.id, property_required_measures=property_required_measures,
|
||||
recommendations=recommendations, selected=selected,
|
||||
)
|
||||
|
||||
# Add best practice measures (ventilation/trickle vents)
|
||||
selected = optimiser_functions.add_best_practice_measures(p.id, solution, recommendations, selected)
|
||||
# Final flattening - Don't do this!
|
||||
# recommendations[p.id] = optimiser_functions.flatten_recommendations_with_defaults(
|
||||
# p.id, recommendations, selected
|
||||
# )
|
||||
|
||||
# TODO: functionise
|
||||
for measure in funded_measures:
|
||||
if "+mechanical_ventilation" in measure["type"]:
|
||||
measure["type"] = measure["type"].split("+mechanical_ventilation")[0]
|
||||
|
||||
p.insert_funding(
|
||||
scheme=scheme,
|
||||
funded_measures=funded_measures,
|
||||
project_funding=project_funding,
|
||||
total_uplift=total_uplift,
|
||||
full_project_score=full_project_score,
|
||||
partial_project_score=partial_project_score,
|
||||
uplift_project_score=uplift_project_score
|
||||
)
|
||||
|
|
@ -1,7 +1,6 @@
|
|||
from pathlib import Path
|
||||
import numpy as np
|
||||
import pandas as pd
|
||||
from BaseUtility import Definitions
|
||||
from etl.epc.settings import (
|
||||
DATA_PROCESSOR_SETTINGS,
|
||||
EARLIEST_EPC_DATE,
|
||||
|
|
@ -22,6 +21,7 @@ from etl.epc.settings import (
|
|||
ENDING_SUFFIX_COMPONENT_COLS,
|
||||
POTENTIAL_COLUMNS,
|
||||
EFFICIENCY_FEATURES,
|
||||
DATA_ANOMALY_MATCHES
|
||||
)
|
||||
from recommendations.rdsap_tables import FLOOR_LEVEL_MAP
|
||||
|
||||
|
|
@ -247,8 +247,7 @@ class EPCDataProcessor:
|
|||
# Map all anomaly values to None
|
||||
data_anomaly_map = dict(
|
||||
zip(
|
||||
Definitions.DATA_ANOMALY_MATCHES,
|
||||
[None] * len(Definitions.DATA_ANOMALY_MATCHES),
|
||||
DATA_ANOMALY_MATCHES, [None] * len(DATA_ANOMALY_MATCHES),
|
||||
)
|
||||
)
|
||||
|
||||
|
|
@ -283,7 +282,7 @@ class EPCDataProcessor:
|
|||
@staticmethod
|
||||
def clean_construction_age_band(x):
|
||||
# Firstly, we check if it's an error value
|
||||
if x in Definitions.DATA_ANOMALY_MATCHES or x in [None, np.nan]:
|
||||
if x in DATA_ANOMALY_MATCHES or x in [None, np.nan]:
|
||||
return x
|
||||
|
||||
# Next, we check if it's a value in our map
|
||||
|
|
|
|||
|
|
@ -593,6 +593,15 @@ class EPCRecord:
|
|||
self.prepared_epc["total-floor-area"]
|
||||
)
|
||||
|
||||
# We handle the edge case of floor area being 0. We set it to zero and it is cleaned by
|
||||
# _clean_with_data_processor
|
||||
if self.prepared_epc['total-floor-area'] == 0:
|
||||
print(
|
||||
"Edge case of floor area being zero - will set to none and will be cleaned in "
|
||||
"_clean_with_data_processor"
|
||||
)
|
||||
self.prepared_epc['total-floor-area'] = None
|
||||
|
||||
def _clean_mains_gas(self):
|
||||
"""
|
||||
This method will clean the mains gas, if empty or invalid
|
||||
|
|
@ -668,7 +677,7 @@ class EPCRecord:
|
|||
|
||||
for attribute in fields:
|
||||
value = self.prepared_epc[attribute]
|
||||
if value in DATA_ANOMALY_MATCHES:
|
||||
if value in DATA_ANOMALY_MATCHES or pd.isnull(value):
|
||||
if attribute in null_attributes:
|
||||
value = None
|
||||
else:
|
||||
|
|
@ -751,6 +760,8 @@ class EPCRecord:
|
|||
if self.prepared_epc["built-form"] in DATA_ANOMALY_MATCHES:
|
||||
if self.prepared_epc["property-type"] in ["Flat", "Maisonette"]:
|
||||
self.prepared_epc["built-form"] = "End-Terrace"
|
||||
else:
|
||||
self.prepared_epc["built-form"] = "Semi-Detached"
|
||||
|
||||
def _clean_age_band(self):
|
||||
"""
|
||||
|
|
|
|||
|
|
@ -48,6 +48,8 @@ DATA_ANOMALY_MATCHES = {
|
|||
None,
|
||||
# An older value which rarely shows up but has been seen in the data.
|
||||
"UNKNOWN",
|
||||
#
|
||||
"Unknown"
|
||||
}
|
||||
|
||||
DATA_ANOMALY_SUBSTRINGS = {
|
||||
|
|
|
|||
|
|
@ -20,6 +20,7 @@ class HotWaterAttributes(Definitions):
|
|||
'solid fuel range cooker',
|
||||
'room heaters', # Generic/unspecified category
|
||||
'electric multipoint',
|
||||
'single-point gas',
|
||||
]
|
||||
|
||||
# SYSTEM_TYPES refer to the larger system within which the heater operates.
|
||||
|
|
@ -29,6 +30,7 @@ class HotWaterAttributes(Definitions):
|
|||
# The hot water is provided by a secondary (or supplementary) heating system in the building
|
||||
'from second main heating system', # Same as 'from secondary system'
|
||||
'community scheme', # The hot water is provided by a community heating system
|
||||
"water heater",
|
||||
]
|
||||
|
||||
# THERMOSTAT_CHARACTERISTICS refer to features related to temperature control in the system.
|
||||
|
|
|
|||
|
|
@ -28,6 +28,9 @@ class LightingAttributes(Definitions):
|
|||
self.nodata = (not description) or (description in self.DATA_ANOMALY_MATCHES) or (
|
||||
description in self.OBSERVED_ERRORS) or (description == "SAP05:Lighting")
|
||||
|
||||
if description == "SAP05:Lighting":
|
||||
self.description = description # Reset self.description
|
||||
|
||||
def welsh_translation_search(self):
|
||||
"""
|
||||
For welsh text describing the percentage of low energy lighting, we match the regular
|
||||
|
|
|
|||
|
|
@ -128,6 +128,7 @@ class MainheatControlAttributes(Definitions):
|
|||
]
|
||||
|
||||
def __init__(self, description: str):
|
||||
|
||||
self.description: str = clean_description(description.lower()).strip()
|
||||
self.nodata = not self.description or description in self.DATA_ANOMALY_MATCHES or (
|
||||
description in self.NO_DATA_DESCRIPTIONS
|
||||
|
|
|
|||
|
|
@ -17,5 +17,5 @@ all_cleaner_map = {
|
|||
'roof-description': RoofAttributes,
|
||||
'walls-description': WallAttributes,
|
||||
'windows-description': WindowAttributes,
|
||||
'lighting-description:': LightingAttributes,
|
||||
'lighting-description': LightingAttributes,
|
||||
}
|
||||
|
|
|
|||
|
|
@ -222,6 +222,11 @@ hotwater_cases = [
|
|||
{'original_description': 'Electric multipoint', 'heater_type': 'electric multipoint', 'system_type': None,
|
||||
'thermostat_characteristics': None,
|
||||
'heating_scope': None, 'energy_recovery': None, 'tariff_type': None, 'extra_features': None, 'chp_systems': None,
|
||||
'distribution_system': None, 'no_system_present': None, 'appliance': None, 'assumed': False}
|
||||
'distribution_system': None, 'no_system_present': None, 'appliance': None, 'assumed': False},
|
||||
{'original_description': 'Single-point gas water heater, standard tariff',
|
||||
'heater_type': 'single-point gas', 'system_type': "water heater", 'thermostat_characteristics': None,
|
||||
'heating_scope': None, 'energy_recovery': None, 'tariff_type': 'standard tariff', 'extra_features': None,
|
||||
'chp_systems': None, 'distribution_system': None, 'no_system_present': None, 'appliance': None
|
||||
}
|
||||
|
||||
]
|
||||
|
|
|
|||
|
|
@ -82,6 +82,14 @@ class HeatingRecommender:
|
|||
"controls_prefix": ""
|
||||
},
|
||||
"dual": None
|
||||
},
|
||||
'Electric storage heaters, room heaters, electric': {
|
||||
"hhr": {
|
||||
"mainheating_description": "Electric storage heaters, radiators",
|
||||
"recommendation_description": "Install high heat retention electric storage heaters.",
|
||||
"controls_prefix": ""
|
||||
},
|
||||
"dual": None
|
||||
}
|
||||
}
|
||||
|
||||
|
|
|
|||
|
|
@ -693,6 +693,7 @@ class Recommendations:
|
|||
|
||||
if hotwater_description in [
|
||||
"From main system", "From main system, no cylinder thermostat",
|
||||
'From main system, waste water heat recovery'
|
||||
]:
|
||||
return {
|
||||
"heating_fuel_type": heating_fuel, "hotwater_fuel_type": heating_fuel,
|
||||
|
|
|
|||
|
|
@ -581,7 +581,7 @@ class RoofRecommendations:
|
|||
**cost_result,
|
||||
"already_installed": already_installed,
|
||||
"survey": rir_non_invasive_recommendation.get("survey", None),
|
||||
"innovation_rate": material.to_dict()["innovation_rate"]
|
||||
"innovation_rate": material.innovation_rate
|
||||
}
|
||||
)
|
||||
|
||||
|
|
|
|||
|
|
@ -66,6 +66,7 @@ class WallRecommendations(Definitions):
|
|||
"Solid brick, as built, partial insulation": "Solid brick, with external insulation",
|
||||
"Cob, as built": "Cob, with external insulation",
|
||||
"System built, as built, no insulation": "System built, with external insulation",
|
||||
'System built, as built, partial insulation': "System built, with external insulation",
|
||||
"Granite or whinstone, as built, no insulation": 'Granite or whinstone, with external insulation',
|
||||
"Timber frame, as built, no insulation": "Timber frame, with external insulation",
|
||||
'Timber frame, as built, partial insulation': 'Timber frame, with external insulation',
|
||||
|
|
@ -81,6 +82,7 @@ class WallRecommendations(Definitions):
|
|||
"Solid brick, as built, partial insulation": "Solid brick, with internal insulation",
|
||||
"Cob, as built": "Cob, with internal insulation",
|
||||
"System built, as built, no insulation": "System built, with internal insulation",
|
||||
'System built, as built, partial insulation': "System built, with internal insulation",
|
||||
"Granite or whinstone, as built, no insulation": 'Granite or whinstone, with internal insulation',
|
||||
"Timber frame, as built, no insulation": "Timber frame, with internal insulation",
|
||||
'Timber frame, as built, partial insulation': 'Timber frame, with internal insulation',
|
||||
|
|
|
|||
Loading…
Add table
Reference in a new issue