diff --git a/etl/customers/stonewater/shdf_3_clustering.py b/etl/customers/stonewater/shdf_3_clustering.py index 18cfee79..efa999e3 100644 --- a/etl/customers/stonewater/shdf_3_clustering.py +++ b/etl/customers/stonewater/shdf_3_clustering.py @@ -2371,6 +2371,10 @@ def updated_version(): asset_list_with_archetypes = asset_list.merge( assigned_clusters[["internal_id", "cluster", "archetype_representative", "rank"]], how="left", on="internal_id" + ).merge( + master_sheet_clustering_features[["Address ID", "Property Type", "Walls", "Roofs", "Heating"]], + how="left", + on="Address ID" ) # We populate the reasons for no archetype @@ -2410,7 +2414,7 @@ def updated_version(): asset_list_with_archetypes["archetype_representative"].fillna(False) ) - asset_list_with_archetypes.to_csv("Stonewater asset list with archetypes V3.csv", index=False) + asset_list_with_archetypes.to_csv("Stonewater asset list with archetypes V3.1.csv", index=False) # Produce the archetyping features archetyping_features_csv = assigned_clusters[