
Commit 3190cd5

Merge pull request #1552 from robbrad/july_25_fixes
July Part 2: Multiple council fixes
2 parents 2049191 + 0d37443 commit 3190cd5

File tree

8 files changed: +327 -264 lines changed


uk_bin_collection/tests/input.json

Lines changed: 3 additions & 5 deletions
@@ -761,13 +761,11 @@
     },
     "EastHertsCouncil": {
         "LAD24CD": "E07000097",
-        "house_number": "1",
-        "postcode": "CM20 2FZ",
         "skip_get_url": true,
-        "url": "https://www.eastherts.gov.uk",
-        "web_driver": "http://selenium:4444",
+        "uprn": "10023088183",
+        "url": "https://east-herts.co.uk/api/services/",
         "wiki_name": "East Herts Council",
-        "wiki_note": "Pass the house number and postcode in their respective parameters."
+        "wiki_note": "Pass the UPRN. You can find it using [FindMyAddress](https://www.findmyaddress.co.uk/search)."
     },
     "EastLindseyDistrictCouncil": {
         "house_number": "1",

uk_bin_collection/uk_bin_collection/councils/BroxbourneCouncil.py

Lines changed: 16 additions & 1 deletion
@@ -22,10 +22,25 @@ def parse_data(self, page: str, **kwargs) -> dict:
         check_postcode(user_postcode)
 
         bindata = {"bins": []}
-        driver = create_webdriver(web_driver, headless, None, __name__)
+        # Use a realistic user agent to help bypass Cloudflare
+        user_agent = "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
+        driver = create_webdriver(web_driver, headless, user_agent, __name__)
 
         try:
             driver.get("https://www.broxbourne.gov.uk/bin-collection-date")
+
+            # Wait for Cloudflare challenge to complete
+            print("Waiting for page to load (Cloudflare check)...")
+            try:
+                WebDriverWait(driver, 45).until(
+                    lambda d: "Just a moment" not in d.title and d.title != "" and len(d.find_elements(By.TAG_NAME, "input")) > 0
+                )
+                print(f"Page loaded: {driver.title}")
+            except Exception:
+                print(f"Timeout waiting for page load. Current title: {driver.title}")
+                # Try to continue anyway
+                pass
+
             time.sleep(8)
 
             # Handle cookie banner with multiple attempts
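
The added wait treats three signals as "Cloudflare finished": the interstitial title ("Just a moment...") is gone, the title is non-empty, and at least one form input has rendered. A standalone sketch of the same pattern, factored into a hypothetical wait_for_cloudflare helper that is not part of this codebase:

    from selenium.common.exceptions import TimeoutException
    from selenium.webdriver.common.by import By
    from selenium.webdriver.support.ui import WebDriverWait


    def wait_for_cloudflare(driver, timeout=45):
        """Return True once the Cloudflare interstitial has been replaced
        by the real page, False if the timeout expires first."""
        try:
            WebDriverWait(driver, timeout).until(
                lambda d: "Just a moment" not in d.title
                and d.title != ""
                and len(d.find_elements(By.TAG_NAME, "input")) > 0
            )
            return True
        except TimeoutException:
            # Caller decides whether to proceed with a partial page
            return False

Returning a boolean rather than swallowing the exception inline keeps the scraper's control flow explicit: the caller can log, retry, or continue with whatever rendered.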
uk_bin_collection/uk_bin_collection/councils/EastHertsCouncil.py

Lines changed: 27 additions & 116 deletions
@@ -1,7 +1,6 @@
-from bs4 import BeautifulSoup
-from selenium.webdriver.common.by import By
-from selenium.webdriver.support import expected_conditions as EC
-from selenium.webdriver.support.wait import WebDriverWait
+import json
+import requests
+from datetime import datetime
 
 from uk_bin_collection.uk_bin_collection.common import *
 from uk_bin_collection.uk_bin_collection.get_bin_data import AbstractGetBinDataClass
@@ -15,116 +14,28 @@ class CouncilClass(AbstractGetBinDataClass):
     """
 
     def parse_data(self, page: str, **kwargs) -> dict:
-        # Get and check UPRN
-        driver = None
-        try:
-            user_postcode = kwargs.get("postcode")
-            user_paon = kwargs.get("paon")
-            check_paon(user_paon)
-            check_postcode(user_postcode)
-            web_driver = kwargs.get("web_driver")
-            headless = kwargs.get("headless")
-            bindata = {"bins": []}
-
-            API_URL = "https://uhte-wrp.whitespacews.com"
-
-            # Create Selenium webdriver
-            driver = create_webdriver(web_driver, headless, None, __name__)
-            driver.get(API_URL)
-
-            # Click Find my bin collection day button
-            collectionButton = WebDriverWait(driver, 10).until(
-                EC.element_to_be_clickable((By.LINK_TEXT, "Find my bin collection day"))
-            )
-            collectionButton.click()
-
-            main_content = WebDriverWait(driver, 10).until(
-                EC.presence_of_element_located((By.ID, "main-content"))
-            )
-
-            # Wait for the property number field to appear then populate it
-            inputElement_number = WebDriverWait(driver, 10).until(
-                EC.element_to_be_clickable(
-                    (
-                        By.ID,
-                        "address_name_number",
-                    )
-                )
-            )
-            inputElement_number.send_keys(user_paon)
-
-            # Wait for the postcode field to appear then populate it
-            inputElement_postcode = WebDriverWait(driver, 10).until(
-                EC.element_to_be_clickable(
-                    (
-                        By.ID,
-                        "address_postcode",
-                    )
-                )
-            )
-            inputElement_postcode.send_keys(user_postcode)
-
-            # Click search button
-            continueButton = WebDriverWait(driver, 10).until(
-                EC.element_to_be_clickable(
-                    (
-                        By.ID,
-                        "Submit",
-                    )
-                )
-            )
-            continueButton.click()
-
-            # Wait for the 'Search Results' to appear and select the first result
-            property = WebDriverWait(driver, 10).until(
-                EC.element_to_be_clickable(
-                    (
-                        By.CSS_SELECTOR,
-                        "li.app-subnav__section-item a",
-                        # "app-subnav__link govuk-link clicker colordarkblue fontfamilyArial fontsize12rem",
-                        # "//a[starts-with(@aria-label, '{user_paon}')]",
-                    )
-                )
-            )
-            property.click()
-
-            upcoming_scheduled_collections = WebDriverWait(driver, 10).until(
-                EC.presence_of_element_located(
-                    (By.ID, "upcoming-scheduled-collections")
-                )
-            )
-
-            soup = BeautifulSoup(driver.page_source, features="html.parser")
-
-            collections = []
-            for collection in soup.find_all(
-                "u1",
-                class_="displayinlineblock justifycontentleft alignitemscenter margin0 padding0",
-            ):
-                date = collection.find(
-                    "p", string=lambda text: text and "/" in text
-                ).text.strip()  # Extract date
-                service = collection.find(
-                    "p", string=lambda text: text and "Collection Service" in text
-                ).text.strip()  # Extract service type
-                collections.append({"date": date, "service": service})
-
-            # Print the parsed data
-            for item in collections:
-
-                dict_data = {
-                    "type": item["service"],
-                    "collectionDate": item["date"],
-                }
-                bindata["bins"].append(dict_data)
-
-        except Exception as e:
-            # Here you can log the exception if needed
-            print(f"An error occurred: {e}")
-            # Optionally, re-raise the exception if you want it to propagate
-            raise
-        finally:
-            # This block ensures that the driver is closed regardless of an exception
-            if driver:
-                driver.quit()
+        user_uprn = kwargs.get("uprn")
+        check_uprn(user_uprn)
+        bindata = {"bins": []}
+
+        # Make API request
+        api_url = f"https://east-herts.co.uk/api/services/{user_uprn}"
+        response = requests.get(api_url)
+        response.raise_for_status()
+
+        data = response.json()
+        today = datetime.now().date()
+
+        for service in data.get("services", []):
+            collection_date_str = service.get("collectionDate")
+            if collection_date_str:
+                collection_date = datetime.strptime(collection_date_str, "%Y-%m-%d").date()
+                # Only include future dates
+                if collection_date >= today:
+                    dict_data = {
+                        "type": service.get("binType", ""),
+                        "collectionDate": collection_date.strftime("%d/%m/%Y"),
+                    }
+                    bindata["bins"].append(dict_data)
+
         return bindata
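
The rewrite replaces the whole Selenium journey with one GET against the council API, and it assumes the endpoint returns JSON of the form {"services": [{"binType": ..., "collectionDate": "YYYY-MM-DD"}, ...]}. A quick standalone sketch for probing the endpoint outside the parser, using the example UPRN from input.json (the response shape is inferred from the parser above, not from published API documentation):

    from datetime import datetime

    import requests

    uprn = "10023088183"  # example UPRN from input.json
    response = requests.get(f"https://east-herts.co.uk/api/services/{uprn}", timeout=10)
    response.raise_for_status()

    for service in response.json().get("services", []):
        raw = service.get("collectionDate")
        if raw:
            when = datetime.strptime(raw, "%Y-%m-%d").date()
            print(f'{service.get("binType", "?"):<20} {when:%d/%m/%Y}')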

uk_bin_collection/uk_bin_collection/councils/EastLothianCouncil.py

Lines changed: 27 additions & 39 deletions
@@ -5,7 +5,6 @@
 from uk_bin_collection.uk_bin_collection.get_bin_data import AbstractGetBinDataClass
 
 
-# import the wonderful Beautiful Soup and the URL grabber
 class CouncilClass(AbstractGetBinDataClass):
     """
     Concrete classes have to implement all abstract operations of the
@@ -14,70 +13,59 @@ class CouncilClass(AbstractGetBinDataClass):
     """
 
     def parse_data(self, page: str, **kwargs) -> dict:
-
         user_postcode = kwargs.get("postcode")
         user_paon = kwargs.get("paon")
         check_postcode(user_postcode)
         check_paon(user_paon)
         bindata = {"bins": []}
 
-        URI = "http://collectiondates.eastlothian.gov.uk/ajax/your-calendar/load-streets-spring-2024.asp"
-
-        payload = {
-            "postcode": user_postcode,
-        }
-
+        # Get address ID from the streets endpoint
+        streets_uri = "https://collectiondates.eastlothian.gov.uk/ajax/your-calendar/load-streets-summer-2025.asp"
         headers = {
-            "Referer": "http://collectiondates.eastlothian.gov.uk/your-calendar",
+            "Referer": "https://collectiondates.eastlothian.gov.uk/your-calendar",
             "User-Agent": "Mozilla/5.0",
         }
-
-        # Make the GET request
-        response = requests.get(URI, headers=headers, params=payload)
-
-        # Parse the HTML with BeautifulSoup
+
+        response = requests.get(streets_uri, params={"postcode": user_postcode}, headers=headers)
         soup = BeautifulSoup(response.text, "html.parser")
-
-        # Find the select dropdown
+
         select = soup.find("select", id="SelectStreet")
-
-        # Find the option that contains "Flat 1"
+        if not select:
+            raise ValueError(f"No streets found for postcode {user_postcode}")
+
         address = select.find("option", string=lambda text: text and user_paon in text)
-
-        URI = "http://collectiondates.eastlothian.gov.uk/ajax/your-calendar/load-recycling-summer-2024.asp"
-
-        payload = {
-            "id": address["value"],
-        }
-
-        # Make the GET request
-        response = requests.get(URI, headers=headers, params=payload)
-
-        # Parse the HTML with BeautifulSoup
+        if not address:
+            raise ValueError(f"Address '{user_paon}' not found for postcode {user_postcode}")
+
+        address_id = address["value"]
+
+        # Get collection data using the correct endpoint
+        collections_uri = "https://collectiondates.eastlothian.gov.uk/ajax/your-calendar/load-recycling-summer-2025.asp"
+        response = requests.get(collections_uri, params={"id": address_id}, headers=headers)
+
         soup = BeautifulSoup(response.text, "html.parser")
-
+
         # Extract collection details
         calendar_items = soup.find_all("div", class_="calendar-item")
         for item in calendar_items:
             waste_label = item.find("div", class_="waste-label").text.strip()
             waste_value = item.find("div", class_="waste-value").find("h4").text.strip()
-
+
             try:
                 collection_date = datetime.strptime(
                     remove_ordinal_indicator_from_date_string(waste_value),
                     "%A %d %B %Y",
                 )
+
+                bindata["bins"].append({
+                    "type": waste_label.replace(" is:", ""),
+                    "collectionDate": collection_date.strftime(date_format),
+                })
             except ValueError:
                 continue
-
-            dict_data = {
-                "type": waste_label.replace(" is:", ""),
-                "collectionDate": collection_date.strftime(date_format),
-            }
-            bindata["bins"].append(dict_data)
-
+
         bindata["bins"].sort(
             key=lambda x: datetime.strptime(x.get("collectionDate"), date_format)
         )
-
+
         return bindata
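
The rewrite keeps the same two-step AJAX flow (postcode → street list → address id → calendar HTML) but switches to HTTPS and the summer-2025 endpoints, fails loudly when the postcode or address matches nothing, and moves the append inside the try block so only successfully parsed dates are recorded. A standalone sketch of that flow with the two requests split into hypothetical helpers; the season-specific .asp filenames are copied from the diff and will presumably roll over again next season:

    import requests
    from bs4 import BeautifulSoup

    BASE = "https://collectiondates.eastlothian.gov.uk/ajax/your-calendar"
    HEADERS = {
        "Referer": "https://collectiondates.eastlothian.gov.uk/your-calendar",
        "User-Agent": "Mozilla/5.0",
    }


    def find_address_id(postcode: str, paon: str) -> str:
        # Step 1: postcode -> <select id="SelectStreet"> of address <option>s
        html = requests.get(
            f"{BASE}/load-streets-summer-2025.asp",
            params={"postcode": postcode},
            headers=HEADERS,
        ).text
        select = BeautifulSoup(html, "html.parser").find("select", id="SelectStreet")
        option = select.find("option", string=lambda t: t and paon in t)
        return option["value"]  # raises TypeError if nothing matched


    def fetch_calendar_html(address_id: str) -> str:
        # Step 2: address id -> HTML fragment of div.calendar-item entries
        return requests.get(
            f"{BASE}/load-recycling-summer-2025.asp",
            params={"id": address_id},
            headers=HEADERS,
        ).text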
