
Commit fa0ec28

fix: #1565 - BCP Council

1 parent a977d55 commit fa0ec28

File tree

3 files changed: +47 -128 lines changed

uk_bin_collection/tests/input.json

Lines changed: 1 addition & 4 deletions

```diff
@@ -102,12 +102,9 @@
     },
     "BCPCouncil": {
         "LAD24CD": "E06000058",
-        "house_number": "3 HARBOUR VIEW ROAD, POOLE, BH14 0PD",
-        "postcode": "BH14 0PD",
-        "web_driver": "http://selenium:4444",
         "skip_get_url": true,
         "uprn": "100040810214",
-        "url": "https://online.bcpcouncil.gov.uk/bindaylookup/",
+        "url": "https://bcpportal.bcpcouncil.gov.uk/checkyourbincollection",
         "wiki_name": "Bournemouth, Christchurch and Poole",
         "wiki_note": "You will need to use [FindMyAddress](https://www.findmyaddress.co.uk/search) to find the UPRN."
     },
```
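With the move to a direct API lookup, the fixture is driven purely by UPRN; the Selenium-era keys are removed. As a quick sanity check over the fixture (a minimal sketch, assuming it runs from the repository root), the entry can be validated like this:

```python
import json

# Load the council test fixtures (path as shown above)
with open("uk_bin_collection/tests/input.json") as f:
    councils = json.load(f)

entry = councils["BCPCouncil"]

# The API-based scraper only needs the UPRN and the new portal URL
assert entry["uprn"] == "100040810214"
assert entry["url"] == "https://bcpportal.bcpcouncil.gov.uk/checkyourbincollection"

# The keys removed in this commit should be gone
for legacy_key in ("house_number", "postcode", "web_driver"):
    assert legacy_key not in entry, f"unexpected legacy key: {legacy_key}"
```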
uk_bin_collection/uk_bin_collection/councils/BCPCouncil.py

Lines changed: 45 additions & 120 deletions

```diff
@@ -1,15 +1,13 @@
-import json
 import time
-from datetime import datetime
-from bs4 import BeautifulSoup
-from selenium.webdriver.common.by import By
-from selenium.webdriver.support.ui import WebDriverWait, Select
-from selenium.webdriver.support import expected_conditions as EC
-from selenium.webdriver.common.keys import Keys
+
+import requests
+from dateutil.relativedelta import relativedelta
+
 from uk_bin_collection.uk_bin_collection.common import *
 from uk_bin_collection.uk_bin_collection.get_bin_data import AbstractGetBinDataClass
 
 
+# Council implementation for Bournemouth, Christchurch and Poole
 class CouncilClass(AbstractGetBinDataClass):
     """
     Concrete classes have to implement all abstract operations of the
@@ -18,116 +16,43 @@ class CouncilClass(AbstractGetBinDataClass):
     """
 
     def parse_data(self, page: str, **kwargs) -> dict:
-        postcode = kwargs.get("postcode")
-        house_number = kwargs.get("paon")
-        web_driver = kwargs.get("web_driver")
-        headless = kwargs.get("headless", True)
-
-        check_postcode(postcode)
-        check_paon(house_number)
-
-        driver = create_webdriver(web_driver, headless=headless)
-
-        try:
-            driver.get("https://bcpportal.bcpcouncil.gov.uk/checkyourbincollection/")
-
-            # Handle cookie banner first
-            try:
-                cookie_button = WebDriverWait(driver, 5).until(
-                    EC.element_to_be_clickable((By.XPATH, "//button[contains(text(), 'Okay')]"))
-                )
-                cookie_button.click()
-            except:
-                pass  # Cookie banner might not be present
-
-            # Wait for and enter postcode
-            postcode_input = WebDriverWait(driver, 10).until(
-                EC.presence_of_element_located((By.CSS_SELECTOR, "input[type='text']"))
-            )
-            postcode_input.clear()
-            postcode_input.send_keys(postcode)
-
-            # Click the search span element
-            search_button = WebDriverWait(driver, 10).until(
-                EC.element_to_be_clickable((By.ID, "searchAddress"))
-            )
-            search_button.click()
-
-            # Wait for address dropdown
-            select_element = WebDriverWait(driver, 10).until(
-                EC.presence_of_element_located((By.TAG_NAME, "select"))
-            )
-
-            # Find and select the address containing the house number
-            address_option = WebDriverWait(driver, 10).until(
-                EC.element_to_be_clickable((By.XPATH, f"//option[contains(text(), 'HARBOUR VIEW ROAD')]"))
-            )
-            address_option.click()
-
-            # Wait for bin collection results to load
-            WebDriverWait(driver, 15).until(
-                EC.presence_of_element_located((By.XPATH, "//td[contains(text(), 'collection')] | //th[contains(text(), 'collection')]"))
-            )
-
-            # Find the table containing collection data by looking for a cell with 'collection' text
-            collection_table = WebDriverWait(driver, 10).until(
-                EC.presence_of_element_located((By.XPATH, "//td[contains(text(), 'collection')]/ancestor::table | //th[contains(text(), 'collection')]/ancestor::table"))
-            )
-
-            # Parse the table data
-            soup = BeautifulSoup(driver.page_source, 'html.parser')
-            data = {"bins": []}
-
-            # Find the table containing collection information
-            collection_cell = soup.find(['td', 'th'], string=lambda text: text and 'collection' in text.lower())
-            if collection_cell:
-                table = collection_cell.find_parent('table')
-                if table:
-                    rows = table.find_all('tr')
-                    for row in rows[1:]:  # Skip header row
-                        cells = row.find_all(['td', 'th'])
-                        if len(cells) >= 2:  # At least bin type and one collection date
-                            bin_type = cells[0].get_text(strip=True)
-                            next_collection = cells[1].get_text(strip=True) if len(cells) > 1 else ""
-                            following_collection = cells[2].get_text(strip=True) if len(cells) > 2 else ""
-
-
-                            # Process next collection date
-                            if bin_type and next_collection and "No collection" not in next_collection:
-                                try:
-                                    # Try multiple date formats
-                                    for date_fmt in ["%A, %d %B %Y", "%A %d %B %Y", "%d/%m/%Y", "%d-%m-%Y", "%Y-%m-%d"]:
-                                        try:
-                                            parsed_date = datetime.strptime(next_collection, date_fmt)
-                                            data["bins"].append({
-                                                "type": bin_type,
-                                                "collectionDate": parsed_date.strftime(date_format)
-                                            })
-                                            break
-                                        except ValueError:
-                                            continue
-                                except:
-                                    continue
-
-                            # Process following collection date
-                            if bin_type and following_collection and "No collection" not in following_collection and "download PDF" not in following_collection:
-                                try:
-                                    # Clean up the following collection text (remove PDF link text)
-                                    following_collection = following_collection.replace("download PDF", "").strip()
-                                    for date_fmt in ["%A, %d %B %Y", "%A %d %B %Y", "%d/%m/%Y", "%d-%m-%Y", "%Y-%m-%d"]:
-                                        try:
-                                            parsed_date = datetime.strptime(following_collection, date_fmt)
-                                            data["bins"].append({
-                                                "type": bin_type,
-                                                "collectionDate": parsed_date.strftime(date_format)
-                                            })
-                                            break
-                                        except ValueError:
-                                            continue
-                                except:
-                                    continue
-
-            return data
-
-        finally:
-            driver.quit()
+        # Look up collections for the property's UPRN via the council's API
+        uprn = kwargs.get("uprn")
+        # usrn = kwargs.get("paon")
+        check_uprn(uprn)
+        # check_usrn(usrn)
+        bindata = {"bins": []}
+
+        # uprn = uprn.zfill(12)
+
+        API_URL = "https://prod-17.uksouth.logic.azure.com/workflows/58253d7b7d754447acf9fe5fcf76f493/triggers/manual/paths/invoke?api-version=2016-06-01&sp=%2Ftriggers%2Fmanual%2Frun&sv=1.0&sig=TAvYIUFj6dzaP90XQCm2ElY6Cd34ze05I3ba7LKTiBs"
+
+        headers = {
+            "Content-Type": "application/json",
+            "Accept": "*/*",
+            "User-Agent": "Mozilla/5.0",
+            "Referer": "https://bcpportal.bcpcouncil.gov.uk/",
+        }
+        s = requests.session()
+        data = {
+            "uprn": uprn,
+        }
+
+        r = s.post(API_URL, json=data, headers=headers)
+        r.raise_for_status()
+
+        data = r.json()
+        rows_data = data["data"]
+        for row in rows_data:
+            bin_type = row["wasteContainerUsageTypeDescription"]
+            collections = row["scheduleDateRange"]
+            for collection in collections:
+                dict_data = {
+                    "type": bin_type,
+                    "collectionDate": datetime.strptime(
+                        collection, "%Y-%m-%d"
+                    ).strftime(date_format),
+                }
+                bindata["bins"].append(dict_data)
+
+        return bindata
```
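The rewrite swaps roughly 120 lines of Selenium automation (cookie banner, postcode entry, address dropdown, table scraping) for a single POST to the Azure Logic App endpoint that backs the council's portal. Stripped of the library's plumbing, the lookup reduces to the sketch below; the endpoint URL, headers, payload, and response fields come straight from the diff, while the printed output is only illustrative:

```python
import requests
from datetime import datetime

# Azure Logic App endpoint used by the BCP portal (from the diff above)
API_URL = (
    "https://prod-17.uksouth.logic.azure.com/workflows/"
    "58253d7b7d754447acf9fe5fcf76f493/triggers/manual/paths/invoke"
    "?api-version=2016-06-01&sp=%2Ftriggers%2Fmanual%2Frun&sv=1.0"
    "&sig=TAvYIUFj6dzaP90XQCm2ElY6Cd34ze05I3ba7LKTiBs"
)

headers = {
    "Content-Type": "application/json",
    "Accept": "*/*",
    "User-Agent": "Mozilla/5.0",
    "Referer": "https://bcpportal.bcpcouncil.gov.uk/",
}

# UPRN from the test fixture; substitute your own property's UPRN
response = requests.post(API_URL, json={"uprn": "100040810214"}, headers=headers)
response.raise_for_status()

# Each row is one container type with a list of ISO-format collection dates
for row in response.json()["data"]:
    bin_type = row["wasteContainerUsageTypeDescription"]
    for collection in row["scheduleDateRange"]:
        date = datetime.strptime(collection, "%Y-%m-%d")
        print(f"{bin_type}: {date:%d/%m/%Y}")
```

Because the endpoint returns ISO-format dates in structured JSON, the old multi-format date parsing and table traversal become unnecessary, which is where most of the 120 deleted lines went.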

wiki/Councils.md

Lines changed: 1 addition & 4 deletions

````diff
@@ -482,14 +482,11 @@ Note: You will need to use [FindMyAddress](https://www.findmyaddress.co.uk/searc
 
 ### Bournemouth, Christchurch and Poole
 ```commandline
-python collect_data.py BCPCouncil https://online.bcpcouncil.gov.uk/bindaylookup/ -s -u XXXXXXXX -p "XXXX XXX" -n XX -w http://HOST:PORT/
+python collect_data.py BCPCouncil https://bcpportal.bcpcouncil.gov.uk/checkyourbincollection -s -u XXXXXXXX
 ```
 Additional parameters:
 - `-s` - skip get URL
 - `-u` - UPRN
-- `-p` - postcode
-- `-n` - house number
-- `-w` - remote Selenium web driver URL (required for Home Assistant)
 
 Note: You will need to use [FindMyAddress](https://www.findmyaddress.co.uk/search) to find the UPRN.
 
````
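For anyone driving the library from Python rather than the documented CLI, the updated class can be called directly. A minimal sketch, assuming the module lives at the repository's usual councils path (uk_bin_collection/uk_bin_collection/councils/BCPCouncil.py) and reusing the UPRN from the test fixture:

```python
from uk_bin_collection.uk_bin_collection.councils.BCPCouncil import CouncilClass

# page is unused by the new implementation (skip_get_url is set),
# so an empty string is fine; only the uprn keyword matters
council = CouncilClass()
data = council.parse_data("", uprn="100040810214")

for bin_entry in data["bins"]:
    print(bin_entry["type"], bin_entry["collectionDate"])
```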
