From 48b807da201142bef87409bfdfc988812fafcae1 Mon Sep 17 00:00:00 2001 From: Jun-te Kim Date: Fri, 30 May 2025 09:09:36 +0000 Subject: [PATCH] save state --- etl/osmosis_complaince_address_to_files.py | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/etl/osmosis_complaince_address_to_files.py b/etl/osmosis_complaince_address_to_files.py index 1448375..620d572 100644 --- a/etl/osmosis_complaince_address_to_files.py +++ b/etl/osmosis_complaince_address_to_files.py @@ -10,6 +10,8 @@ from etl.scraper.scraper import SharePointScraper # board_id = "4965130190" # liz green board_id = "6097500103" +# Cocuun +# board_id = "5185076280" monday_key = "eyJhbGciOiJIUzI1NiJ9.eyJ0aWQiOjQ5ODc2ODQxOCwiYWFpIjoxMSwidWlkIjozNjE3ODAzNCwiaWFkIjoiMjAyNS0wNC0xMVQxMToyMzoxNy40NjdaIiwicGVyIjoibWU6d3JpdGUiLCJhY3RpZCI6MTM5OTc4MjMsInJnbiI6InVzZTEifQ.-2Lit4s46ZF6AXuMW9t0TxIaFLkHqD4Yo-PyM9i2XZY" monday = MondayClient(monday_key) @@ -24,6 +26,7 @@ parent_folder = "/Osmosis ACD/Osmosis ACD Projects/" # Change this per installer # parent_folder += "Stonewater/Wates/REDO" parent_folder += "Installer Documentation/Platform Housing Group/Liv Green" +# parent_folder += "Installer Documentation/Platform Housing Group/Cocuun/REDO" import re @@ -32,7 +35,7 @@ def sanitize_name(name: str, ignore_dot = False) -> str: if ignore_dot: name = ''.join(char for char in name if char.isalnum() or char.isspace() or char == ")" or char == "(").strip() else: - name = ''.join(char for char in name if char.isalnum() or char.isspace() or char == "." or char == ")" or char == "(").strip() + name = ''.join(char for char in name if char.isalnum() or char.isspace() or char == "." or char == ")" or char == "(" or char == "-" or char == "_").strip() name = re.sub(r'\s+', ' ', name) # Remove or replace other SharePoint-invalid characters if necessary @@ -138,7 +141,7 @@ if not name_id or not files_id: items = get_all_items(board_id, monday) for i,item in enumerate(tqdm(items)): - if i>123: + if i>329: item_name = item["name"] item_name = sanitize_name(item_name, ignore_dot=True) print(f"Item name is {item_name}")