Merge pull request #1112 from Hestia-Homes/main

epc token
Merge pull request #1111 from Hestia-Homes/feature/address2uprn_quick_fix
2026-06-30 13:10:47 +00:00 · 2026-05-20 16:48:11 +01:00 · 2026-05-20 16:46:58 +01:00 · 2026-05-20 15:43:41 +00:00 · 2026-05-20 16:26:48 +01:00 · 2026-05-20 16:26:07 +01:00
204 changed files with 3446 additions and 123 deletions
--- a/.dockerignore
+++ b/.dockerignore
@ -6,7 +6,7 @@ backend/.idea/*
 backend/.env
 recommendations/tests/*
 model_data/tests/*
-infrastructure/*
+deployment/*
 data_collection/*
 node_modules/*
 conservation_areas/*
--- a/.github/workflows/_build_image.yml
+++ b/.github/workflows/_build_image.yml
@ -40,6 +40,8 @@ on:
        required: false
      EPC_AUTH_TOKEN:
        required: false
+      OPEN_EPC_API_TOKEN:
+        required: false

 jobs:
  build:
@ -50,6 +52,7 @@ jobs:
      DEV_DB_PORT: ${{ secrets.DEV_DB_PORT }}
      DEV_DB_NAME: ${{ secrets.DEV_DB_NAME }}
      EPC_AUTH_TOKEN: ${{ secrets.EPC_AUTH_TOKEN }}
+      OPEN_EPC_API_TOKEN: ${{ secrets.OPEN_EPC_API_TOKEN }}

    outputs:
      image_digest: ${{ steps.digest.outputs.image_digest }}
--- a/.github/workflows/deploy_terraform.yml
+++ b/.github/workflows/deploy_terraform.yml
@ -62,20 +62,20 @@ jobs:
      - uses: hashicorp/setup-terraform@v3

      - name: Terraform Init
-        working-directory: infrastructure/terraform/shared
+        working-directory: deployment/terraform/shared
        run: terraform init -reconfigure

      - name: Terraform Workspace
-        working-directory: infrastructure/terraform/shared
+        working-directory: deployment/terraform/shared
        run: terraform workspace select ${STAGE} || terraform workspace new ${STAGE}

      - name: Terraform Plan
-        working-directory: infrastructure/terraform/shared
+        working-directory: deployment/terraform/shared
        run: terraform plan -var-file=${STAGE}.tfvars -out=tfplan

      - name: Terraform Apply
        if: env.TERRAFORM_APPLY == 'true'
-        working-directory: infrastructure/terraform/shared
+        working-directory: deployment/terraform/shared
        run: terraform apply -auto-approve tfplan

  # ============================================================
@ -101,7 +101,7 @@ jobs:
    uses: ./.github/workflows/_deploy_lambda.yml
    with:
      lambda_name: ara_engine
-      lambda_path: infrastructure/terraform/lambda/engine
+      lambda_path: deployment/terraform/lambda/engine
      stage: ${{ needs.determine_stage.outputs.stage }}
      ecr_repo: engine-${{ needs.determine_stage.outputs.stage }}
      image_digest: ${{ needs.ara_engine_image.outputs.image_digest }}
@ -133,6 +133,7 @@ jobs:
        DEV_DB_PORT=$DEV_DB_PORT
        DEV_DB_NAME=$DEV_DB_NAME
        EPC_AUTH_TOKEN=$EPC_AUTH_TOKEN
+        OPEN_EPC_API_TOKEN=$OPEN_EPC_API_TOKEN
    secrets:
      AWS_ACCESS_KEY_ID: ${{ secrets.DEV_AWS_ACCESS_KEY_ID }}
      AWS_SECRET_ACCESS_KEY: ${{ secrets.DEV_AWS_SECRET_ACCESS_KEY }}
@ -141,6 +142,7 @@ jobs:
      DEV_DB_PORT: ${{ secrets.DEV_DB_PORT }}
      DEV_DB_NAME: ${{ secrets.DEV_DB_NAME }}
      EPC_AUTH_TOKEN: ${{ secrets.DEV_EPC_AUTH_TOKEN }}
+      OPEN_EPC_API_TOKEN: ${{ secrets.DEV_OPEN_EPC_API_TOKEN }}

  # ============================================================
  # Deploy Address 2 UPRN Lambda
@ -150,7 +152,7 @@ jobs:
    uses: ./.github/workflows/_deploy_lambda.yml
    with:
      lambda_name: address2uprn
-      lambda_path: infrastructure/terraform/lambda/address2UPRN
+      lambda_path: deployment/terraform/lambda/address2UPRN
      stage: ${{ needs.determine_stage.outputs.stage }}
      ecr_repo: address2uprn-${{ needs.determine_stage.outputs.stage }}
      image_digest: ${{ needs.address2uprn_image.outputs.image_digest }}
@ -169,7 +171,7 @@ jobs:
    uses: ./.github/workflows/_build_image.yml
    with:
      ecr_repo: postcode_splitter-${{ needs.determine_stage.outputs.stage }}
-      dockerfile_path: backend/postcode_splitter/handler/Dockerfile
+      dockerfile_path: applications/postcode_splitter/Dockerfile
      build_context: .
      build_args: |
        DEV_DB_HOST=$DEV_DB_HOST
@ -191,7 +193,7 @@ jobs:
    uses: ./.github/workflows/_deploy_lambda.yml
    with:
      lambda_name: postcodeSplitter
-      lambda_path: infrastructure/terraform/lambda/postcodeSplitter
+      lambda_path: deployment/terraform/lambda/postcodeSplitter
      stage: ${{ needs.determine_stage.outputs.stage }}
      ecr_repo: postcode_splitter-${{ needs.determine_stage.outputs.stage }}
      image_digest: ${{ needs.postcodeSplitter_image.outputs.image_digest }}
@ -231,7 +233,7 @@ jobs:
    uses: ./.github/workflows/_deploy_lambda.yml
    with:
      lambda_name: bulk_address2uprn_combiner
-      lambda_path: infrastructure/terraform/lambda/bulk_address2uprn_combiner
+      lambda_path: deployment/terraform/lambda/bulk_address2uprn_combiner
      stage: ${{ needs.determine_stage.outputs.stage }}
      ecr_repo: bulk_address2uprn_combiner-${{ needs.determine_stage.outputs.stage }}
      image_digest: ${{ needs.bulk_address2uprn_combiner_image.outputs.image_digest }}
@ -271,7 +273,7 @@ jobs:
    uses: ./.github/workflows/_deploy_lambda.yml
    with:
      lambda_name: condition-etl
-      lambda_path: infrastructure/terraform/lambda/condition-etl
+      lambda_path: deployment/terraform/lambda/condition-etl
      stage: ${{ needs.determine_stage.outputs.stage }}
      ecr_repo: condition-etl-${{ needs.determine_stage.outputs.stage }}
      image_digest: ${{ needs.condition_etl_image.outputs.image_digest }}
@ -311,7 +313,7 @@ jobs:
    uses: ./.github/workflows/_deploy_lambda.yml
    with:
      lambda_name: categorisation
-      lambda_path: infrastructure/terraform/lambda/categorisation
+      lambda_path: deployment/terraform/lambda/categorisation
      stage: ${{ needs.determine_stage.outputs.stage }}
      ecr_repo: categorisation-${{ needs.determine_stage.outputs.stage }}
      image_digest: ${{ needs.categorisation_image.outputs.image_digest }}
@ -351,7 +353,7 @@ jobs:
    uses: ./.github/workflows/_deploy_lambda.yml
    with:
      lambda_name: ordnanceSurvey
-      lambda_path: infrastructure/terraform/lambda/ordnanceSurvey
+      lambda_path: deployment/terraform/lambda/ordnanceSurvey
      stage: ${{ needs.determine_stage.outputs.stage }}
      ecr_repo: ordnance-${{ needs.determine_stage.outputs.stage }}
      image_digest: ${{ needs.ordnanceSurvey_image.outputs.image_digest }}
@ -386,7 +388,7 @@ jobs:
    uses: ./.github/workflows/_deploy_lambda.yml
    with:
      lambda_name: pashub_to_ara
-      lambda_path: infrastructure/terraform/lambda/pashub_to_ara
+      lambda_path: deployment/terraform/lambda/pashub_to_ara
      stage: ${{ needs.determine_stage.outputs.stage }}
      ecr_repo: pashub_to_ara-${{ needs.determine_stage.outputs.stage }}
      image_digest: ${{ needs.pashub_to_ara_image.outputs.image_digest }}
@ -419,7 +421,7 @@ jobs:
    uses: ./.github/workflows/_deploy_lambda.yml
    with:
      lambda_name: ara_fast_api
-      lambda_path: infrastructure/terraform/lambda/fast-api
+      lambda_path: deployment/terraform/lambda/fast-api
      stage: ${{ needs.determine_stage.outputs.stage }}
      terraform_apply: ${{ needs.determine_stage.outputs.terraform_apply }}
    secrets:
@ -458,17 +460,17 @@ jobs:
      - uses: hashicorp/setup-terraform@v3

      - name: Terraform Init
-        working-directory: infrastructure/terraform/cdn_certificate
+        working-directory: deployment/terraform/cdn_certificate
        run: terraform init -reconfigure

      - name: Terraform Workspace
-        working-directory: infrastructure/terraform/cdn_certificate
+        working-directory: deployment/terraform/cdn_certificate
        run: |
          terraform workspace select $STAGE \
            || terraform workspace new $STAGE

      - name: Terraform Plan
-        working-directory: infrastructure/terraform/cdn_certificate
+        working-directory: deployment/terraform/cdn_certificate
        run: |
          terraform plan \
            -var="stage=${STAGE}" \
@ -476,7 +478,7 @@ jobs:

      - name: Terraform Apply
        if: env.TERRAFORM_APPLY == 'true'
-        working-directory: infrastructure/terraform/cdn_certificate
+        working-directory: deployment/terraform/cdn_certificate
        run: terraform apply -auto-approve tfplan


@ -503,17 +505,17 @@ jobs:
      - uses: hashicorp/setup-terraform@v3

      - name: Terraform Init
-        working-directory: infrastructure/terraform/cdn
+        working-directory: deployment/terraform/cdn
        run: terraform init -reconfigure

      - name: Terraform Workspace
-        working-directory: infrastructure/terraform/cdn
+        working-directory: deployment/terraform/cdn
        run: |
          terraform workspace select $STAGE \
            || terraform workspace new $STAGE

      - name: Terraform Plan
-        working-directory: infrastructure/terraform/cdn
+        working-directory: deployment/terraform/cdn
        run: |
          terraform plan \
            -var="stage=${STAGE}" \
@ -521,7 +523,7 @@ jobs:

      - name: Terraform Apply
        if: env.TERRAFORM_APPLY == 'true'
-        working-directory: infrastructure/terraform/cdn
+        working-directory: deployment/terraform/cdn
        run: terraform apply -auto-approve tfplan

  # ============================================================
@ -562,7 +564,7 @@ jobs:
    uses: ./.github/workflows/_deploy_lambda.yml
    with:
      lambda_name: magic_plan
-      lambda_path: infrastructure/terraform/lambda/magic_plan
+      lambda_path: deployment/terraform/lambda/magic_plan
      stage: ${{ needs.determine_stage.outputs.stage }}
      ecr_repo: magic-plan-${{ needs.determine_stage.outputs.stage }}
      image_digest: ${{ needs.magic_plan_image.outputs.image_digest }}
@ -585,7 +587,7 @@ jobs:
    uses: ./.github/workflows/_deploy_lambda.yml
    with:
      lambda_name: hubspot-etl-to-ara
-      lambda_path: infrastructure/terraform/lambda/hubspot_deal_etl
+      lambda_path: deployment/terraform/lambda/hubspot_deal_etl
      stage: ${{ needs.determine_stage.outputs.stage }}
      ecr_repo: hubspot-etl-${{ needs.determine_stage.outputs.stage }}
      image_digest: ${{ needs.hubspot_etl_image.outputs.image_digest }}
--- a/.github/workflows/lambda_smoke_tests.yml
+++ b/.github/workflows/lambda_smoke_tests.yml
@ -36,6 +36,13 @@ jobs:
      build_context: .
      service_name: postcode-splitter

+  # Smoke-tests the image built from applications/postcode_splitter/Dockerfile.
+  # Uses service_name postcode-splitter-ddd, distinct from the postcode-splitter
+  # job above.
+  postcode_splitter_ddd_smoke_test:
+    uses: ./.github/workflows/_smoke_test_lambda.yml
+    with:
+      dockerfile_path: applications/postcode_splitter/Dockerfile
+      build_context: .
+      service_name: postcode-splitter-ddd
+
  # ============================================================
  # Bulk Address2UPRN Combiner
  # ============================================================
--- a/.github/workflows/unit_tests.yml
+++ b/.github/workflows/unit_tests.yml
@ -60,3 +60,15 @@ jobs:
            -e DB_PASSWORD=test \
            -e DB_PORT=5432 \
            model-test pytest -vv -m 'not integration'
+
+      # The DDD rewrite (tests/) defines SQLModel table classes that map to the
+      # same physical tables as the legacy backend models. Both sets share the
+      # one global SQLModel.metadata, so they cannot be imported into the same
+      # pytest process. The DDD suite therefore runs as a separate pytest
+      # invocation until the legacy models are retired. Its DB is spawned
+      # in-process by pytest-postgresql, so no DB service or env is required.
+      - name: Run DDD tests
+        run: |
+          docker run --rm \
+            --network host \
+            model-test pytest -vv tests/
--- a/.gitignore
+++ b/.gitignore
@ -121,6 +121,7 @@ celerybeat.pid

 # Environments
 .env
+.env.local
 .venv
 env/
 venv/
--- a/AGENTS.md
+++ b/AGENTS.md
@ -1,29 +0,0 @@
-
-<!-- BACKLOG.MD MCP GUIDELINES START -->
-
-<CRITICAL_INSTRUCTION>
-
-## BACKLOG WORKFLOW INSTRUCTIONS
-
-This project uses Backlog.md MCP for all task and project management activities.
-
-**CRITICAL GUIDANCE**
-
- If your client supports MCP resources, read `backlog://workflow/overview` to understand when and how to use Backlog for this project.
- If your client only supports tools or the above request fails, call `backlog.get_backlog_instructions()` to load the tool-oriented overview. Use the `instruction` selector when you need `task-creation`, `task-execution`, or `task-finalization`.
-
- **First time working here?** Read the overview resource IMMEDIATELY to learn the workflow
- **Already familiar?** You should have the overview cached ("## Backlog.md Overview (MCP)")
- **When to read it**: BEFORE creating tasks, or when you're unsure whether to track work
-
-These guides cover:
- Decision framework for when to create tasks
- Search-first workflow to avoid duplicates
- Links to detailed guides for task creation, execution, and finalization
- MCP tools reference
-
-You MUST read the overview resource to understand the complete workflow. The information is NOT summarized here.
-
-</CRITICAL_INSTRUCTION>
-
-<!-- BACKLOG.MD MCP GUIDELINES END -->
--- a/CLAUDE.md
+++ b/CLAUDE.md
@ -1,33 +1,4 @@

-<!-- BACKLOG.MD MCP GUIDELINES START -->
-
-<CRITICAL_INSTRUCTION>
-
-## BACKLOG WORKFLOW INSTRUCTIONS
-
-This project uses Backlog.md MCP for all task and project management activities.
-
-**CRITICAL GUIDANCE**
-
- If your client supports MCP resources, read `backlog://workflow/overview` to understand when and how to use Backlog for this project.
- If your client only supports tools or the above request fails, call `backlog.get_backlog_instructions()` to load the tool-oriented overview. Use the `instruction` selector when you need `task-creation`, `task-execution`, or `task-finalization`.
-
- **First time working here?** Read the overview resource IMMEDIATELY to learn the workflow
- **Already familiar?** You should have the overview cached ("## Backlog.md Overview (MCP)")
- **When to read it**: BEFORE creating tasks, or when you're unsure whether to track work
-
-These guides cover:
- Decision framework for when to create tasks
- Search-first workflow to avoid duplicates
- Links to detailed guides for task creation, execution, and finalization
- MCP tools reference
-
-You MUST read the overview resource to understand the complete workflow. The information is NOT summarized here.
-
-</CRITICAL_INSTRUCTION>
-
-<!-- BACKLOG.MD MCP GUIDELINES END -->
-
 ## Available Skills

 Five Claude Code skills are installed in this repo's dev container. Each maps to a phase of the feature lifecycle.
--- a/Dockerfile.test.dockerignore
+++ b/Dockerfile.test.dockerignore
@ -4,7 +4,7 @@ model_data/local_data/
 backend/node_modules/
 backend/.idea/
 backend/.env
-infrastructure/
+deployment/
 data_collection/
 node_modules/
 conservation_areas/
--- a/UBIQUITOUS_LANGUAGE.md
+++ b/UBIQUITOUS_LANGUAGE.md
@ -23,7 +23,7 @@ Invoke `/ubiquitous-language` in any session to extract new terms from the conve
 |------|------------|------------------|
 | **UPRN** | Unique Property Reference Number — the government-issued permanent identifier for a physical address in the UK. | "property ID", "address ID", "code" |
 | **Postcode** | A UK postal code used to group nearby addresses; the primary search key for finding EPC records. | "zip code", "postal code" |
-| **User Address** | A free-text address string provided by a user or imported from a customer dataset, before any normalisation or matching. | "user input", "raw address", "user_inputed_address" |
+| **User Address** | A structured dataclass (`domain.addresses.user_address.UserAddress`) capturing a customer-supplied address: a free-text `user_address` line, a canonical `postcode` (sanitised on construction), and an optional `internal_reference`. The bare string sense -- the raw free-text address line as it arrives from upstream ingestion, before being wrapped -- remains valid when discussing CSV columns, API payloads, or other upstream contexts; in domain code, prefer the dataclass. | "user input", "raw address", "user_inputed_address" |
 | **Dwelling** | A single residential unit that can hold an EPC — a house, flat, or maisonette. | "property", "unit", "home" |

 ## Address Matching
@ -72,7 +72,7 @@ Invoke `/ubiquitous-language` in any session to extract new terms from the conve

 ## Flagged ambiguities

- **"address"** appears as both the raw **User Address** (free-text from customer data) and a structured field on an **EPC Search Result** (normalised address lines). Always qualify: "user address" vs "EPC address" or "address line 1".
+- **"address"** appears as both the raw **User Address** (free-text from customer data, or the structured `UserAddress` dataclass that wraps it) and a structured field on an **EPC Search Result** (normalised address lines). Always qualify: "user address" vs "EPC address" or "address line 1". Within `domain/`, **User Address** specifically means the `UserAddress` dataclass; in upstream ingestion contexts (CSV columns, SQS payloads) it can still mean the raw string sense.
 - **"score"** is used for the `AddressMatch.score()` function output, the `lexiscore` DataFrame column, and informally in conversation. Prefer **Lexiscore** in domain discussions; reserve "score" for method-level code comments.
 - **"user_inputed_address"** in `backend/address2UPRN/main.py` is a misspelling and a synonym for **User Address** — the canonical term. New code should use `user_address`.
 - **"EPC"** is overloaded as both the document (an Energy Performance Certificate) and the rating band letter. Use **EPC** for the document and **EPC Band** for the letter.
--- a/applications/init.py
+++ b/applications/init.py
--- a/applications/postcode_splitter/Dockerfile
+++ b/applications/postcode_splitter/Dockerfile
@ -0,0 +1,34 @@
+# Container image for the postcode_splitter handler
+# (applications/postcode_splitter/handler.py), built from the repository root.
+FROM public.ecr.aws/lambda/python:3.11
+
+# Postgres host/port/database are baked into the image at build time from
+# the deploy workflow's --build-arg values (GitHub Actions DEV_DB_* secrets),
+# mirroring backend/postcode_splitter/handler/Dockerfile. They map onto the
+# POSTGRES_* names PostgresConfig.from_env reads. Username/password are NOT
+# baked in -- Terraform injects those as Lambda env vars from Secrets Manager.
+ARG DEV_DB_HOST
+ARG DEV_DB_PORT
+ARG DEV_DB_NAME
+
+ENV POSTGRES_HOST=${DEV_DB_HOST}
+ENV POSTGRES_PORT=${DEV_DB_PORT}
+ENV POSTGRES_DATABASE=${DEV_DB_NAME}
+
+WORKDIR /var/task
+
+# Dependencies are installed before the source is copied, so Docker can reuse
+# this layer when only source files change.
+COPY applications/postcode_splitter/requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+
+# Copy the layered source the handler imports from. The new splitter pulls
+# only DDD-shaped packages — no pandas, no legacy backend/.
+COPY domain/ domain/
+COPY infrastructure/ infrastructure/
+COPY orchestration/ orchestration/
+COPY repositories/ repositories/
+COPY utilities/ utilities/
+COPY applications/ applications/
+
+# Place the handler at the Lambda task root so the runtime can resolve
+# ``main.handler`` without an extra package prefix.
+COPY applications/postcode_splitter/handler.py /var/task/main.py
+
+CMD ["main.handler"]
--- a/applications/postcode_splitter/init.py
+++ b/applications/postcode_splitter/init.py
--- a/applications/postcode_splitter/handler.py
+++ b/applications/postcode_splitter/handler.py
@ -0,0 +1,52 @@
+from __future__ import annotations
+
+import os
+from typing import Any
+
+import boto3
+
+from applications.postcode_splitter.postcode_splitter_trigger_body import (
+    PostcodeSplitterTriggerBody,
+)
+from infrastructure.address2uprn_queue_client import Address2UprnQueueClient
+from infrastructure.csv_s3_client import CsvS3Client
+from orchestration.postcode_splitter_orchestrator import PostcodeSplitterOrchestrator
+from orchestration.task_orchestrator import TaskOrchestrator
+from repositories.user_address.user_address_csv_s3_repository import (
+    UserAddressCsvS3Repository,
+)
+from utilities.aws_lambda.subtask_handler import subtask_handler
+
+
+@subtask_handler()
+def handler(
+    body: dict[str, Any], context: Any, task_orchestrator: TaskOrchestrator
+) -> dict[str, list[str]]:
+    """Lambda entry point: hand the triggering CSV to the postcode splitter.
+
+    Validates ``body`` as a ``PostcodeSplitterTriggerBody``, builds the S3 and
+    SQS clients from environment configuration, and delegates to
+    ``PostcodeSplitterOrchestrator.split_and_dispatch``.
+
+    Args:
+        body: Trigger payload; must validate as ``PostcodeSplitterTriggerBody``
+            (``task_id``, ``sub_task_id``, ``s3_uri``).
+        context: Lambda context object; not used in this function.
+        task_orchestrator: Passed through to the splitter. NOTE(review):
+            presumably supplied by ``@subtask_handler()`` -- confirm.
+
+    Returns:
+        ``{"child_subtask_ids": [...]}``, where each id returned by
+        ``split_and_dispatch`` has been converted with ``str``.
+
+    Raises:
+        KeyError: If ``S3_BUCKET_NAME`` or ``ADDRESS2UPRN_QUEUE_URL`` is unset.
+        pydantic.ValidationError: If ``body`` does not match the trigger model.
+    """
+    trigger = PostcodeSplitterTriggerBody.model_validate(body)
+
+    # Required configuration: indexing os.environ fails fast when either is missing.
+    bucket = os.environ["S3_BUCKET_NAME"]
+    queue_url = os.environ["ADDRESS2UPRN_QUEUE_URL"]
+
+    # boto3.client is overloaded per-service in the installed stubs; cast
+    # to Any so the strict-mode checker treats it as opaque.
+    boto3_client: Any = boto3.client  # pyright: ignore[reportUnknownMemberType, reportUnknownVariableType]
+    boto_s3: Any = boto3_client("s3")
+    boto_sqs: Any = boto3_client("sqs")
+
+    # Wrap the raw boto3 clients in the project's S3/CSV and queue abstractions.
+    csv_client = CsvS3Client(boto_s3, bucket)
+    user_address_repo = UserAddressCsvS3Repository(csv_client, bucket)
+    queue_client = Address2UprnQueueClient(boto_sqs, queue_url)
+
+    splitter = PostcodeSplitterOrchestrator(
+        task_orchestrator=task_orchestrator,
+        user_address_repo=user_address_repo,
+        queue_client=queue_client,
+    )
+
+    child_ids = splitter.split_and_dispatch(
+        parent_task_id=trigger.task_id,
+        parent_subtask_id=trigger.sub_task_id,
+        input_s3_uri=trigger.s3_uri,
+    )
+
+    # Stringify the ids before putting them in the response dict.
+    return {"child_subtask_ids": [str(cid) for cid in child_ids]}
--- a/applications/postcode_splitter/local_handler/.env.local.example
+++ b/applications/postcode_splitter/local_handler/.env.local.example
@ -0,0 +1,34 @@
+# Local-test environment for the postcode_splitter Lambda.
+#
+#   cp .env.local.example .env.local   then fill in the values below.
+#
+# .env.local is gitignored. The container hits REAL AWS and a REAL Postgres,
+# so every value here points at infrastructure that actually exists.
+#
+# NOTE: the new DDD code uses different env var names than the repo root
+# .env. The mapping (root .env name -> var here) is given per section.
+# Keep comments on their own lines — docker-compose's env_file parser folds a
+# trailing "# ..." into the value.
+
+# --- Postgres (orchestration/default_orchestrator -> PostgresConfig.from_env) ---
+# POSTGRES_HOST <- DB_HOST, PORT <- DB_PORT, USERNAME <- DB_USERNAME,
+# PASSWORD <- DB_PASSWORD, DATABASE <- DB_NAME.
+POSTGRES_HOST=
+POSTGRES_PORT=5432
+POSTGRES_USERNAME=
+POSTGRES_PASSWORD=
+POSTGRES_DATABASE=
+# Optional; defaults to psycopg2 when unset.
+# POSTGRES_DRIVER=psycopg2
+
+# --- Handler config (applications/postcode_splitter/handler.py) ---
+# S3_BUCKET_NAME: bucket holding the input address CSV (root .env: DATA_BUCKET).
+# ADDRESS2UPRN_QUEUE_URL: SQS queue the splitter fans batches out to; not in
+# the root .env (Terraform sets it in prod).
+S3_BUCKET_NAME=
+ADDRESS2UPRN_QUEUE_URL=
+
+# --- AWS credentials for boto3 (S3 + SQS clients) ---
+AWS_ACCESS_KEY_ID=
+AWS_SECRET_ACCESS_KEY=
+AWS_DEFAULT_REGION=eu-west-2
+# Only needed when using temporary/SSO credentials.
+# AWS_SESSION_TOKEN=
--- a/applications/postcode_splitter/local_handler/docker-compose.yml
+++ b/applications/postcode_splitter/local_handler/docker-compose.yml
@ -0,0 +1,9 @@
+# Local harness: builds the postcode_splitter Lambda image and runs it with
+# the settings from .env.local.
+services:
+  postcode-splitter:
+    build:
+      # The build context is three directories up so that the `dockerfile`
+      # path and the Dockerfile's COPY sources resolve from there.
+      context: ../../../
+      dockerfile: applications/postcode_splitter/Dockerfile
+    ports:
+      # Host port 9001 is the port invoke_local_lambda.py posts to.
+      - "9001:8080"
+    env_file:
+      - .env.local
--- a/applications/postcode_splitter/local_handler/invoke_local_lambda.py
+++ b/applications/postcode_splitter/local_handler/invoke_local_lambda.py
@ -0,0 +1,28 @@
+#!/usr/bin/env python3
+"""POST a sample event to the locally running postcode_splitter container.
+
+The event holds a single record whose ``body`` is a JSON string carrying
+``task_id``, ``sub_task_id`` and ``s3_uri``. The status code and raw response
+text are printed.
+"""
+import json
+import requests
+
+HOST = "localhost"
+PORT = "9001"
+
+LAMBDA_URL = f"http://{HOST}:{PORT}/2015-03-31/functions/function/invocations"
+
+# (connect, read) timeouts in seconds. Without a timeout, requests waits
+# indefinitely if the container accepts the connection but never answers.
+# The read timeout is generous because the container talks to real AWS and a
+# real Postgres while handling the event.
+REQUEST_TIMEOUT = (5, 900)
+
+payload = {
+    "Records": [
+        {
+            "body": json.dumps(
+                {
+                    "task_id": "f4b3332f-c0cc-481f-96a5-d39860a647cf",
+                    "sub_task_id": "14c042de-40c4-473b-8cd8-72c983a94a8d",
+                    "s3_uri": "s3://retrofit-data-dev/ara_raw_inputs/calico/Calico Homes Full list EPC Properties(Sheet2) (1) (1).csv",
+                }
+            )
+        }
+    ]
+}
+
+response = requests.post(LAMBDA_URL, json=payload, timeout=REQUEST_TIMEOUT)
+
+print("Status code:", response.status_code)
+print("Response:")
+print(response.text)
--- a/applications/postcode_splitter/local_handler/run_local.sh
+++ b/applications/postcode_splitter/local_handler/run_local.sh
@ -0,0 +1,12 @@
+#!/usr/bin/env bash
+# Build and start the local postcode_splitter container with docker compose.
+set -euo pipefail
+# Run from this script's directory so the relative paths below resolve.
+cd "$(dirname "$0")"
+
+# First run: seed .env.local from the template, then stop so it can be filled in.
+if [ ! -f .env.local ]; then
+  cp .env.local.example .env.local
+  echo "Created .env.local from the template — fill it in, then re-run." >&2
+  exit 1
+fi
+
+# Rebuild the image without the layer cache and recreate the container each run.
+docker compose build --no-cache
+docker compose up --force-recreate
--- a/applications/postcode_splitter/postcode_splitter_trigger_body.py
+++ b/applications/postcode_splitter/postcode_splitter_trigger_body.py
@ -0,0 +1,11 @@
+from uuid import UUID
+
+from pydantic import BaseModel, ConfigDict
+
+
+class PostcodeSplitterTriggerBody(BaseModel):
+    """Trigger payload that the postcode splitter handler validates its body against."""
+
+    # Keys beyond the three fields below are accepted rather than rejected.
+    model_config = ConfigDict(extra="allow")
+
+    # Passed to split_and_dispatch as parent_task_id.
+    task_id: UUID
+    # Passed to split_and_dispatch as parent_subtask_id.
+    sub_task_id: UUID
+    # Passed to split_and_dispatch as input_s3_uri.
+    s3_uri: str
--- a/applications/postcode_splitter/requirements.txt
+++ b/applications/postcode_splitter/requirements.txt
@ -0,0 +1,4 @@
+boto3
+pydantic
+sqlmodel
+psycopg2-binary
--- a/asset_list/app.py
+++ b/asset_list/app.py
@ -79,23 +79,23 @@ def app():
    """

    data_folder = "/workspaces/model/asset_list"
-    data_filename = "input.xlsx"
-    sheet_name = "Handovers"
-    postcode_column = "POSTCODE"
-    address1_column = "Full Addres"
+    data_filename = "lincs_address_list.xlsx"
+    sheet_name = "Sheet1"
+    postcode_column = "Postcode"
+    address1_column = "Deal Name"
    address1_method = None
-    fulladdress_column = "Full Addres"
+    fulladdress_column = "Deal Name"
    address_cols_to_concat = []
    missing_postcodes_method = None
    landlord_year_built = None
-    landlord_os_uprn = "domna_found_uprn"
-    landlord_property_type = "PROPERTY TYPE"  # Good to include if landlord gave
-    landlord_built_form = "Type Description"  # Good to include if landlord gave
+    landlord_os_uprn = None
+    landlord_property_type = None  # Good to include if landlord gave
+    landlord_built_form = None  # Good to include if landlord gave
    landlord_wall_construction = None
    landlord_roof_construction = None
    landlord_heating_system = None
    landlord_existing_pv = None
-    landlord_property_id = "PROP REF"
+    landlord_property_id = "landlord_id"
    landlord_sap = None
    outcomes_filename = None
    outcomes_sheetname = None
@ -468,9 +468,3 @@ def app():
                asset_list.duplicated_addresses.to_excel(
                    writer, sheet_name="Duplicate Properties", index=False
                )
-
-
-
-
-for key,value in dict.items():
-    lsakjfldsa
--- a/backend/address2UPRN/handler/Dockerfile
+++ b/backend/address2UPRN/handler/Dockerfile
@ -6,11 +6,13 @@ ARG DEV_DB_HOST
 ARG DEV_DB_PORT
 ARG DEV_DB_NAME
 ARG EPC_AUTH_TOKEN
+ARG OPEN_EPC_API_TOKEN

 ENV DB_HOST=${DEV_DB_HOST}
 ENV DB_PORT=${DEV_DB_PORT}
 ENV DB_NAME=${DEV_DB_NAME}
 ENV EPC_AUTH_TOKEN=${EPC_AUTH_TOKEN}
+ENV OPEN_EPC_API_TOKEN=${OPEN_EPC_API_TOKEN}


 # Set working directory (Lambda task root)
--- a/backend/address2UPRN/handler/requirements.txt
+++ b/backend/address2UPRN/handler/requirements.txt
@ -8,4 +8,5 @@ boto3==1.35.44
 sqlmodel
 sqlalchemy==2.0.36
 psycopg2-binary==2.9.10
-pydantic-settings==2.6.0
+pydantic-settings==2.6.0
+httpx
--- a/infrastructure/terraform/README.md
+++ b/infrastructure/terraform/README.md
--- a/infrastructure/terraform/cdn/main.tf
+++ b/infrastructure/terraform/cdn/main.tf
--- a/infrastructure/terraform/cdn/provider.tf
+++ b/infrastructure/terraform/cdn/provider.tf
--- a/infrastructure/terraform/cdn/variables.tf
+++ b/infrastructure/terraform/cdn/variables.tf
--- a/infrastructure/terraform/cdn_certificate/main.tf
+++ b/infrastructure/terraform/cdn_certificate/main.tf
--- a/infrastructure/terraform/cdn_certificate/outputs.tf
+++ b/infrastructure/terraform/cdn_certificate/outputs.tf
--- a/infrastructure/terraform/cdn_certificate/provider.tf
+++ b/infrastructure/terraform/cdn_certificate/provider.tf
--- a/infrastructure/terraform/cdn_certificate/variables.tf
+++ b/infrastructure/terraform/cdn_certificate/variables.tf
--- a/infrastructure/terraform/lambda/_template/README.md
+++ b/infrastructure/terraform/lambda/_template/README.md
@ -10,7 +10,7 @@
 ### 2. Add infrastructure prerequisites (shared stack)
 - Add a new ECR repository in:

-  infrastructure/terraform/shared/main.tf
+  deployment/terraform/shared/main.tf

 - Create a PR to deploy this to main then dev in order to deploy the shared stack

--- a/infrastructure/terraform/lambda/_template/main.tf
+++ b/infrastructure/terraform/lambda/_template/main.tf
--- a/infrastructure/terraform/lambda/_template/provider.tf
+++ b/infrastructure/terraform/lambda/_template/provider.tf
--- a/infrastructure/terraform/lambda/_template/variables.tf
+++ b/infrastructure/terraform/lambda/_template/variables.tf
--- a/infrastructure/terraform/lambda/address2UPRN/main.tf
+++ b/infrastructure/terraform/lambda/address2UPRN/main.tf
--- a/infrastructure/terraform/lambda/address2UPRN/outputs.tf
+++ b/infrastructure/terraform/lambda/address2UPRN/outputs.tf
--- a/infrastructure/terraform/lambda/address2UPRN/provider.tf
+++ b/infrastructure/terraform/lambda/address2UPRN/provider.tf
--- a/infrastructure/terraform/lambda/address2UPRN/variables.tf
+++ b/infrastructure/terraform/lambda/address2UPRN/variables.tf
--- a/infrastructure/terraform/lambda/bulk_address2uprn_combiner/main.tf
+++ b/infrastructure/terraform/lambda/bulk_address2uprn_combiner/main.tf
--- a/infrastructure/terraform/lambda/bulk_address2uprn_combiner/outputs.tf
+++ b/infrastructure/terraform/lambda/bulk_address2uprn_combiner/outputs.tf
--- a/infrastructure/terraform/lambda/bulk_address2uprn_combiner/provider.tf
+++ b/infrastructure/terraform/lambda/bulk_address2uprn_combiner/provider.tf
--- a/infrastructure/terraform/lambda/bulk_address2uprn_combiner/variables.tf
+++ b/infrastructure/terraform/lambda/bulk_address2uprn_combiner/variables.tf
--- a/infrastructure/terraform/lambda/categorisation/main.tf
+++ b/infrastructure/terraform/lambda/categorisation/main.tf
--- a/infrastructure/terraform/lambda/categorisation/outputs.tf
+++ b/infrastructure/terraform/lambda/categorisation/outputs.tf
--- a/infrastructure/terraform/lambda/categorisation/provider.tf
+++ b/infrastructure/terraform/lambda/categorisation/provider.tf
--- a/infrastructure/terraform/lambda/categorisation/variables.tf
+++ b/infrastructure/terraform/lambda/categorisation/variables.tf
--- a/infrastructure/terraform/lambda/condition-etl/main.tf
+++ b/infrastructure/terraform/lambda/condition-etl/main.tf
--- a/infrastructure/terraform/lambda/condition-etl/provider.tf
+++ b/infrastructure/terraform/lambda/condition-etl/provider.tf
--- a/infrastructure/terraform/lambda/condition-etl/variables.tf
+++ b/infrastructure/terraform/lambda/condition-etl/variables.tf
--- a/infrastructure/terraform/lambda/ecmk_to_ara/main.tf
+++ b/infrastructure/terraform/lambda/ecmk_to_ara/main.tf
--- a/infrastructure/terraform/lambda/ecmk_to_ara/provider.tf
+++ b/infrastructure/terraform/lambda/ecmk_to_ara/provider.tf
--- a/infrastructure/terraform/lambda/ecmk_to_ara/variables.tf
+++ b/infrastructure/terraform/lambda/ecmk_to_ara/variables.tf
--- a/infrastructure/terraform/lambda/engine/main.tf
+++ b/infrastructure/terraform/lambda/engine/main.tf
--- a/infrastructure/terraform/lambda/engine/outputs.tf
+++ b/infrastructure/terraform/lambda/engine/outputs.tf
--- a/infrastructure/terraform/lambda/engine/provider.tf
+++ b/infrastructure/terraform/lambda/engine/provider.tf
--- a/infrastructure/terraform/lambda/engine/variables.tf
+++ b/infrastructure/terraform/lambda/engine/variables.tf
--- a/infrastructure/terraform/lambda/fast-api/main.tf
+++ b/infrastructure/terraform/lambda/fast-api/main.tf
--- a/infrastructure/terraform/lambda/fast-api/outputs.tf
+++ b/infrastructure/terraform/lambda/fast-api/outputs.tf
--- a/infrastructure/terraform/lambda/fast-api/provider.tf
+++ b/infrastructure/terraform/lambda/fast-api/provider.tf
--- a/infrastructure/terraform/lambda/fast-api/variables.tf
+++ b/infrastructure/terraform/lambda/fast-api/variables.tf
--- a/infrastructure/terraform/lambda/hubspot_deal_etl/main.tf
+++ b/infrastructure/terraform/lambda/hubspot_deal_etl/main.tf
--- a/infrastructure/terraform/lambda/hubspot_deal_etl/provider.tf
+++ b/infrastructure/terraform/lambda/hubspot_deal_etl/provider.tf
--- a/infrastructure/terraform/lambda/hubspot_deal_etl/variables.tf
+++ b/infrastructure/terraform/lambda/hubspot_deal_etl/variables.tf
--- a/infrastructure/terraform/lambda/magic_plan/main.tf
+++ b/infrastructure/terraform/lambda/magic_plan/main.tf
--- a/infrastructure/terraform/lambda/magic_plan/outputs.tf
+++ b/infrastructure/terraform/lambda/magic_plan/outputs.tf
--- a/infrastructure/terraform/lambda/magic_plan/provider.tf
+++ b/infrastructure/terraform/lambda/magic_plan/provider.tf
--- a/infrastructure/terraform/lambda/magic_plan/variables.tf
+++ b/infrastructure/terraform/lambda/magic_plan/variables.tf
--- a/infrastructure/terraform/lambda/ordnanceSurvey/main.tf
+++ b/infrastructure/terraform/lambda/ordnanceSurvey/main.tf
--- a/infrastructure/terraform/lambda/ordnanceSurvey/provider.tf
+++ b/infrastructure/terraform/lambda/ordnanceSurvey/provider.tf
--- a/infrastructure/terraform/lambda/ordnanceSurvey/variables.tf
+++ b/infrastructure/terraform/lambda/ordnanceSurvey/variables.tf
--- a/infrastructure/terraform/lambda/pashub_to_ara/main.tf
+++ b/infrastructure/terraform/lambda/pashub_to_ara/main.tf
--- a/infrastructure/terraform/lambda/pashub_to_ara/outputs.tf
+++ b/infrastructure/terraform/lambda/pashub_to_ara/outputs.tf
--- a/infrastructure/terraform/lambda/pashub_to_ara/provider.tf
+++ b/infrastructure/terraform/lambda/pashub_to_ara/provider.tf
--- a/infrastructure/terraform/lambda/pashub_to_ara/variables.tf
+++ b/infrastructure/terraform/lambda/pashub_to_ara/variables.tf
--- a/infrastructure/terraform/lambda/postcodeSplitter/main.tf
+++ b/infrastructure/terraform/lambda/postcodeSplitter/main.tf
@ -38,22 +38,8 @@ module "lambda" {
    {
      STAGE     = var.stage
      LOG_LEVEL = "info"
-      DB_USERNAME = local.db_credentials.db_assessment_model_username
-      DB_PASSWORD = local.db_credentials.db_assessment_model_password
-      GOOGLE_SOLAR_API_KEY = "test"
-      SAP_PREDICTIONS_BUCKET = "test"
-      CARBON_PREDICTIONS_BUCKET = "test"
-      HEAT_PREDICTIONS_BUCKET = "test"
-      HEATING_KWH_PREDICTIONS_BUCKET = "test"
-      HOTWATER_KWH_PREDICTIONS_BUCKET = "test"
-      API_KEY = "test"
-      ENVIRONMENT = "test"
-      SECRET_KEY = "test"
-      PLAN_TRIGGER_BUCKET = "test"
-      DATA_BUCKET = "test"
-      EPC_AUTH_TOKEN = "test"
-      ENGINE_SQS_URL = "test"
-      ENERGY_ASSESSMENTS_BUCKET = "test"
+      POSTGRES_USERNAME = local.db_credentials.db_assessment_model_username
+      POSTGRES_PASSWORD = local.db_credentials.db_assessment_model_password
      ADDRESS2UPRN_QUEUE_URL = data.terraform_remote_state.address2uprn.outputs.address2uprn_queue_url
      S3_BUCKET_NAME = data.terraform_remote_state.shared.outputs.retrofit_sap_data_bucket_name
    },
--- a/infrastructure/terraform/lambda/postcodeSplitter/outputs.tf
+++ b/infrastructure/terraform/lambda/postcodeSplitter/outputs.tf
--- a/infrastructure/terraform/lambda/postcodeSplitter/provider.tf
+++ b/infrastructure/terraform/lambda/postcodeSplitter/provider.tf
--- a/infrastructure/terraform/lambda/postcodeSplitter/variables.tf
+++ b/infrastructure/terraform/lambda/postcodeSplitter/variables.tf
--- a/infrastructure/terraform/modules/acm_certificate/main.tf
+++ b/infrastructure/terraform/modules/acm_certificate/main.tf
--- a/infrastructure/terraform/modules/acm_certificate/outputs.tf
+++ b/infrastructure/terraform/modules/acm_certificate/outputs.tf
--- a/infrastructure/terraform/modules/acm_certificate/variables.tf
+++ b/infrastructure/terraform/modules/acm_certificate/variables.tf
--- a/infrastructure/terraform/modules/cloudfront/main.tf
+++ b/infrastructure/terraform/modules/cloudfront/main.tf
--- a/infrastructure/terraform/modules/cloudfront/variables.tf
+++ b/infrastructure/terraform/modules/cloudfront/variables.tf
--- a/infrastructure/terraform/modules/container_registry/main.tf
+++ b/infrastructure/terraform/modules/container_registry/main.tf
--- a/infrastructure/terraform/modules/container_registry/outputs.tf
+++ b/infrastructure/terraform/modules/container_registry/outputs.tf
--- a/infrastructure/terraform/modules/container_registry/variables.tf
+++ b/infrastructure/terraform/modules/container_registry/variables.tf
--- a/infrastructure/terraform/modules/ecr/main.tf
+++ b/infrastructure/terraform/modules/ecr/main.tf
--- a/infrastructure/terraform/modules/ecr/outputs.tf
+++ b/infrastructure/terraform/modules/ecr/outputs.tf
--- a/infrastructure/terraform/modules/ecr/variables.tf
+++ b/infrastructure/terraform/modules/ecr/variables.tf
--- a/infrastructure/terraform/modules/general_iam_policy/main.tf
+++ b/infrastructure/terraform/modules/general_iam_policy/main.tf
--- a/infrastructure/terraform/modules/general_iam_policy/outputs.tf
+++ b/infrastructure/terraform/modules/general_iam_policy/outputs.tf
--- a/infrastructure/terraform/modules/general_iam_policy/variables.tf
+++ b/infrastructure/terraform/modules/general_iam_policy/variables.tf
--- a/infrastructure/terraform/modules/lambda_execution_role/main.tf
+++ b/infrastructure/terraform/modules/lambda_execution_role/main.tf
--- a/infrastructure/terraform/modules/lambda_execution_role/outputs.tf
+++ b/infrastructure/terraform/modules/lambda_execution_role/outputs.tf
--- a/infrastructure/terraform/modules/lambda_execution_role/variables.tf
+++ b/infrastructure/terraform/modules/lambda_execution_role/variables.tf
--- a/infrastructure/terraform/modules/lambda_service/main.tf
+++ b/infrastructure/terraform/modules/lambda_service/main.tf
--- a/infrastructure/terraform/modules/lambda_service/outputs.tf
+++ b/infrastructure/terraform/modules/lambda_service/outputs.tf
--- a/infrastructure/terraform/modules/lambda_service/variables.tf
+++ b/infrastructure/terraform/modules/lambda_service/variables.tf
--- a/infrastructure/terraform/modules/lambda_service_zip/main.tf
+++ b/infrastructure/terraform/modules/lambda_service_zip/main.tf
--- a/Show more
+++ b/Show more
Author	SHA1	Message	Date
Jun-te Kim	326ec2485d	Merge pull request #1112 from Hestia-Homes/main Some checks failed Fast Api Backend Deploy / deploy (push) Has been cancelled Details Deploy infrastructure / determine_stage (push) Has been cancelled Details Deploy infrastructure / address2uprn_lambda (push) Has been cancelled Details Deploy infrastructure / shared_terraform (push) Has been cancelled Details Deploy infrastructure / ara_engine_image (push) Has been cancelled Details Deploy infrastructure / ara_engine_lambda (push) Has been cancelled Details Deploy infrastructure / address2uprn_image (push) Has been cancelled Details Deploy infrastructure / postcodeSplitter_image (push) Has been cancelled Details Deploy infrastructure / postcodeSplitter_lambda (push) Has been cancelled Details Deploy infrastructure / bulk_address2uprn_combiner_image (push) Has been cancelled Details Deploy infrastructure / bulk_address2uprn_combiner_lambda (push) Has been cancelled Details Deploy infrastructure / condition_etl_image (push) Has been cancelled Details Deploy infrastructure / condition_etl_lambda (push) Has been cancelled Details Deploy infrastructure / categorisation_image (push) Has been cancelled Details Deploy infrastructure / categorisation_lambda (push) Has been cancelled Details Deploy infrastructure / ordnanceSurvey_image (push) Has been cancelled Details Deploy infrastructure / ordnanceSurvey_lambda (push) Has been cancelled Details Deploy infrastructure / pashub_to_ara_image (push) Has been cancelled Details Deploy infrastructure / pashub_to_ara_lambda (push) Has been cancelled Details Deploy infrastructure / fast_api_lambda (push) Has been cancelled Details Deploy infrastructure / cloudfront_acm (push) Has been cancelled Details Deploy infrastructure / cloudfront_cdn (push) Has been cancelled Details Deploy infrastructure / hubspot_etl_image (push) Has been cancelled Details Deploy infrastructure / magic_plan_image (push) Has been cancelled Details Deploy infrastructure / 
magic_plan_lambda (push) Has been cancelled Details Deploy infrastructure / hubspot_etl_lambda (push) Has been cancelled Details epc token	2026-05-20 16:48:11 +01:00
Jun-te Kim	97947c9e32	Merge pull request #1111 from Hestia-Homes/feature/address2uprn_quick_fix epc token added	2026-05-20 16:46:58 +01:00
Jun-te Kim	53b211e951	epc token added	2026-05-20 15:43:41 +00:00
Jun-te Kim	b2873f9d0b	Merge pull request #1110 from Hestia-Homes/main deploy new post code splitter	2026-05-20 16:26:48 +01:00
Jun-te Kim	bd36f203e8	Merge pull request #1109 from Hestia-Homes/feature/rewrite_task_handler actually deploy postcode splitter	2026-05-20 16:26:07 +01:00
Jun-te Kim	78c1d150fa	added smoke test	2026-05-20 15:25:42 +00:00
Jun-te Kim	8610a0c875	actually deploy postcode splitter	2026-05-20 15:17:55 +00:00
Jun-te Kim	0fd0dfb1c7	Merge pull request #1108 from Hestia-Homes/main Postcode splitter rewrite	2026-05-20 16:02:22 +01:00
Jun-te Kim	9ad4f3359f	Merge pull request #1107 from Hestia-Homes/feature/rewrite_task_handler Feature/rewrite task handler and postcode splitter	2026-05-20 15:56:02 +01:00
Jun-te Kim	154b820b29	pytest.ini	2026-05-20 14:26:46 +00:00
Jun-te Kim	f10947699e	pytest.ini	2026-05-20 14:13:04 +00:00
Jun-te Kim	00f0cb5442	Merge pull request #1106 from Hestia-Homes/claude/Model-p3 Refactor postcode_splitter into the DDD layout (project #3)	2026-05-20 15:01:29 +01:00
Jun-te Kim	dc159e0b45	tests framework completed	2026-05-20 14:00:19 +00:00
Jun-te Kim	d0cf3d14ad	get rid of comments	2026-05-20 13:21:11 +00:00
Jun-te Kim	8bb90a5aa5	sanitisation of postcode	2026-05-20 12:57:03 +00:00
Jun-te Kim	914a8ed51e	postcode splitter working e2e	2026-05-20 11:07:40 +00:00
Jun-te Kim	0a04448217	applications/postcode_splitter: PostcodeSplitterOrchestrator + Lambda entrypoint slice Wires slice 1-5 primitives into a deployable splitter: - orchestration/postcode_splitter_orchestrator.py: PostcodeSplitterOrchestrator loads addresses via UserAddressRepository, groups by postcode via iter_postcode_grouped_batches, persists each batch under ara_postcode_splitter_batches/{task_id}/{subtask_id}/, creates a WAITING child SubTask, and publishes an address2UPRN SQS message per batch. - applications/postcode_splitter/: Lambda entrypoint. handler.py is decorated with @subtask_handler() so the parent SubTask lifecycle is decorator-owned; PostcodeSplitterTriggerBody validates the body. Dockerfile is the python:3.11 Lambda base with the DDD-shaped source layers and no pandas. - tests/orchestration/test_postcode_splitter_orchestrator.py: integration test using moto S3 + moto SQS + in-memory SQLite that exercises the full wiring against a fixture CSV spanning three postcode groups (one oversize) and asserts child count, persisted inputs, queue bodies, and dispatch order. backend/postcode_splitter/ and .github/workflows/deploy_terraform.yml are intentionally unchanged: the dockerfile_path flip is deferred until the companion backend/address2UPRN/ migration is also ready.	2026-05-19 17:46:12 +00:00
Jun-te Kim	708f1b5d18	repositories: UserAddressRepository + UserAddressCsvS3Repository (CSV-on-S3 adapter) Adds the persistence layer for UserAddress batches: - Abstract UserAddressRepository with load_batch / save_batch. - Concrete UserAddressCsvS3Repository over CsvS3Client: - load_batch reads canonical upload columns (Address 1/2/3, Postcode, Internal Reference), comma-joins non-empty address parts, and passes Internal Reference through (None when missing/empty). - save_batch writes a 3-column CSV (user_address,postcode, internal_reference) to {path_prefix}/{ISO datetime}_{uuid8}.csv and returns the s3://bucket/key URI. - Postcode sanitisation flows through UserAddress.__post_init__; the repo never calls sanitise_postcode directly. Tests (moto-backed) cover: three-line address load, Address-1-only load, missing Internal Reference, save->reload round trip, and unique-filename-per-save. pyright --strict clean. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>	2026-05-19 17:37:02 +00:00
Jun-te Kim	d70e8a9e53	utilities/aws_lambda: @subtask_handler injects TaskOrchestrator as third positional arg The wrapped function now receives the decorator-owned TaskOrchestrator as a third positional argument so handlers can compose their own use-case orchestrator that shares the session, instead of opening a second Postgres connection per invocation. Both existing callers (backend/ordnanceSurvey/main.py and backend/bulk_address2uprn_combiner/main.py) have their signatures extended to accept the new positional argument (typed Optional[TaskOrchestrator] so the legacy backend.utils.subtasks.subtask_handler — which only passes two args — keeps working until the migration to the new decorator lands). @task_handler is intentionally unchanged in this slice; symmetry is deferred per issue #1103.	2026-05-19 17:31:27 +00:00
Jun-te Kim	d7f14033ba	orchestration: add TaskOrchestrator.create_child_subtask primitive Adds a primitive for creating a new WAITING SubTask under an existing parent Task, routing all SubTask creation through the orchestrator (replacing the legacy SubTaskInterface path used by the splitter). Skips _cascade because a new WAITING child against an IN_PROGRESS parent is a no-op under Task.recalculate_from_subtasks.	2026-05-19 17:19:41 +00:00
Jun-te Kim	7b00a33cd2	infrastructure: typed S3/SQS clients (S3Client, CsvS3Client, SqsClient, Address2UprnQueueClient) Slice 3/6 of the postcode_splitter refactor (Hestia-Homes/Model#1101). Introduces a thin typed infrastructure layer wrapping boto3 for the AWS side of the splitter. S3Client/SqsClient are bucket-/queue-bound byte adapters; CsvS3Client subclasses S3Client to round-trip CSV row dicts via the existing parse_s3_uri helper in utils/s3.py; Address2UprnQueueClient subclasses SqsClient to publish the typed {task_id, sub_task_id, s3_uri} fan-out body the downstream consumer expects. moto[s3,sqs] is pulled into test.requirements.txt and the new tests/infrastructure/ suite exercises each client against the moto backend (S3 round-trip, CSV round-trip, SQS send + body inspection, typed publish + body inspection). pyright --strict is clean on the new modules. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>	2026-05-19 17:12:21 +00:00
Jun-te Kim	6198d7a46d	postcode_splitter: pure domain (UserAddress, sanitise_postcode, postcode_batching) Slice 1/6 of the postcode_splitter refactor (Hestia-Homes/Model#1100). Introduces the pure-domain foundation under domain/, with no AWS, Postgres, or pandas. UserAddress is a frozen dataclass that sanitises its postcode in __post_init__ via the canonical sanitise_postcode helper, and iter_postcode_grouped_batches preserves the legacy splitter's batching invariants (group-by-postcode in insertion order, never split a group, oversize single-postcode groups dispatched whole, final flush). Updates UBIQUITOUS_LANGUAGE.md so the User Address term covers both the dataclass sense (preferred in domain code) and the raw upstream-string sense. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>	2026-05-19 16:45:47 +00:00
Jun-te Kim	54a674b5c8	added postcode splitter rewrite to ddd	2026-05-19 16:35:09 +00:00
Jun-te Kim	bc8ca3ead3	deployment from infrastructure	2026-05-19 12:55:30 +00:00