uk_bin_collection 0.119.0__py3-none-any.whl → 0.121.0__py3-none-any.whl

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the two versions as they appear in their public registries.
Files changed (27)
  1. uk_bin_collection/tests/input.json +116 -9
  2. uk_bin_collection/uk_bin_collection/councils/BaberghDistrictCouncil.py +3 -1
  3. uk_bin_collection/uk_bin_collection/councils/CheltenhamBoroughCouncil.py +102 -0
  4. uk_bin_collection/uk_bin_collection/councils/CotswoldDistrictCouncil.py +3 -3
  5. uk_bin_collection/uk_bin_collection/councils/CumberlandAllerdaleCouncil.py +93 -0
  6. uk_bin_collection/uk_bin_collection/councils/EastAyrshireCouncil.py +11 -8
  7. uk_bin_collection/uk_bin_collection/councils/EnvironmentFirst.py +14 -0
  8. uk_bin_collection/uk_bin_collection/councils/FolkstoneandHytheDistrictCouncil.py +81 -0
  9. uk_bin_collection/uk_bin_collection/councils/HackneyCouncil.py +85 -0
  10. uk_bin_collection/uk_bin_collection/councils/HartlepoolBoroughCouncil.py +83 -0
  11. uk_bin_collection/uk_bin_collection/councils/KingsLynnandWestNorfolkBC.py +59 -0
  12. uk_bin_collection/uk_bin_collection/councils/LondonBoroughHavering.py +75 -0
  13. uk_bin_collection/uk_bin_collection/councils/LondonBoroughLewisham.py +132 -0
  14. uk_bin_collection/uk_bin_collection/councils/MidSuffolkDistrictCouncil.py +3 -1
  15. uk_bin_collection/uk_bin_collection/councils/MorayCouncil.py +65 -0
  16. uk_bin_collection/uk_bin_collection/councils/NewcastleUnderLymeCouncil.py +66 -0
  17. uk_bin_collection/uk_bin_collection/councils/NorthHertfordshireDistrictCouncil.py +93 -0
  18. uk_bin_collection/uk_bin_collection/councils/RoyalBoroughofGreenwich.py +113 -0
  19. uk_bin_collection/uk_bin_collection/councils/SandwellBoroughCouncil.py +87 -0
  20. uk_bin_collection/uk_bin_collection/councils/ThurrockCouncil.py +93 -0
  21. uk_bin_collection/uk_bin_collection/councils/WestNorthamptonshireCouncil.py +12 -10
  22. uk_bin_collection/uk_bin_collection/councils/WyreForestDistrictCouncil.py +65 -0
  23. {uk_bin_collection-0.119.0.dist-info → uk_bin_collection-0.121.0.dist-info}/METADATA +1 -1
  24. {uk_bin_collection-0.119.0.dist-info → uk_bin_collection-0.121.0.dist-info}/RECORD +27 -12
  25. {uk_bin_collection-0.119.0.dist-info → uk_bin_collection-0.121.0.dist-info}/LICENSE +0 -0
  26. {uk_bin_collection-0.119.0.dist-info → uk_bin_collection-0.121.0.dist-info}/WHEEL +0 -0
  27. {uk_bin_collection-0.119.0.dist-info → uk_bin_collection-0.121.0.dist-info}/entry_points.txt +0 -0
uk_bin_collection/uk_bin_collection/councils/HackneyCouncil.py (new file)
@@ -0,0 +1,85 @@
+import time
+
+import requests
+
+from uk_bin_collection.uk_bin_collection.common import *
+from uk_bin_collection.uk_bin_collection.get_bin_data import AbstractGetBinDataClass
+
+
+# import the wonderful Beautiful Soup and the URL grabber
+class CouncilClass(AbstractGetBinDataClass):
+    """
+    Concrete classes have to implement all abstract operations of the
+    base class. They can also override some operations with a default
+    implementation.
+    """
+
+    def parse_data(self, page: str, **kwargs) -> dict:
+
+        user_paon = kwargs.get("paon")
+        user_postcode = kwargs.get("postcode")
+        check_postcode(user_postcode)
+        check_paon(user_paon)
+        bindata = {"bins": []}
+
+        URI = "https://waste-api-hackney-live.ieg4.net/f806d91c-e133-43a6-ba9a-c0ae4f4cccf6/property/opensearch"
+
+        data = {
+            "Postcode": user_postcode,
+        }
+        headers = {"Content-Type": "application/json"}
+
+        # Make the POST request
+        response = requests.post(URI, json=data, headers=headers)
+
+        addresses = response.json()
+
+        for address in addresses["addressSummaries"]:
+            summary = address["summary"]
+            if user_paon in summary:
+                systemId = address["systemId"]
+                if systemId:
+                    URI = f"https://waste-api-hackney-live.ieg4.net/f806d91c-e133-43a6-ba9a-c0ae4f4cccf6/alloywastepages/getproperty/{systemId}"
+
+                    response = requests.get(URI)
+
+                    address = response.json()
+
+                    binIDs = address["providerSpecificFields"][
+                        "attributes_wasteContainersAssignableWasteContainers"
+                    ]
+                    for binID in binIDs.split(","):
+                        URI = f"https://waste-api-hackney-live.ieg4.net/f806d91c-e133-43a6-ba9a-c0ae4f4cccf6/alloywastepages/getbin/{binID}"
+                        response = requests.get(URI)
+                        getBin = response.json()
+
+                        bin_type = getBin["subTitle"]
+
+                        URI = f"https://waste-api-hackney-live.ieg4.net/f806d91c-e133-43a6-ba9a-c0ae4f4cccf6/alloywastepages/getcollection/{binID}"
+                        response = requests.get(URI)
+                        getcollection = response.json()
+
+                        collectionID = getcollection["scheduleCodeWorkflowID"]
+
+                        URI = f"https://waste-api-hackney-live.ieg4.net/f806d91c-e133-43a6-ba9a-c0ae4f4cccf6/alloywastepages/getworkflow/{collectionID}"
+                        response = requests.get(URI)
+                        collection_dates = response.json()
+
+                        dates = collection_dates["trigger"]["dates"]
+
+                        for date in dates:
+                            parsed_datetime = datetime.strptime(
+                                date, "%Y-%m-%dT%H:%M:%SZ"
+                            ).strftime(date_format)
+
+                            dict_data = {
+                                "type": bin_type.strip(),
+                                "collectionDate": parsed_datetime,
+                            }
+                            bindata["bins"].append(dict_data)
+
+        bindata["bins"].sort(
+            key=lambda x: datetime.strptime(x.get("collectionDate"), "%d/%m/%Y")
+        )
+
+        return bindata
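The new Hackney scraper ignores its page argument (and the time import) and instead chains five ieg4.net endpoints: opensearch (postcode to addresses), getproperty (systemId to container IDs), then getbin, getcollection and getworkflow per container. A minimal sketch of driving the class directly; the house number and postcode are placeholders, and instantiating CouncilClass by hand sidesteps the package's normal entry point:

from uk_bin_collection.uk_bin_collection.councils.HackneyCouncil import CouncilClass

# Placeholder address values; parse_data performs the live API calls itself.
data = CouncilClass().parse_data("", paon="10", postcode="E8 1EA")
for entry in data["bins"]:
    print(entry["type"], entry["collectionDate"])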
uk_bin_collection/uk_bin_collection/councils/HartlepoolBoroughCouncil.py (new file)
@@ -0,0 +1,83 @@
+import time
+
+import requests
+from bs4 import BeautifulSoup
+
+from uk_bin_collection.uk_bin_collection.common import *
+from uk_bin_collection.uk_bin_collection.get_bin_data import AbstractGetBinDataClass
+
+
+# import the wonderful Beautiful Soup and the URL grabber
+class CouncilClass(AbstractGetBinDataClass):
+    """
+    Concrete classes have to implement all abstract operations of the
+    base class. They can also override some operations with a default
+    implementation.
+    """
+
+    def parse_data(self, page: str, **kwargs) -> dict:
+
+        user_uprn = kwargs.get("uprn")
+        check_uprn(user_uprn)
+        bindata = {"bins": []}
+
+        SESSION_URL = "https://online.hartlepool.gov.uk/authapi/isauthenticated?uri=https%253A%252F%252Fonline.hartlepool.gov.uk%252Fservice%252FRefuse_and_recycling___check_bin_day&hostname=online.hartlepool.gov.uk&withCredentials=true"
+
+        API_URL = "https://online.hartlepool.gov.uk/apibroker/runLookup"
+
+        headers = {
+            "Content-Type": "application/json",
+            "Accept": "application/json",
+            "User-Agent": "Mozilla/5.0",
+            "X-Requested-With": "XMLHttpRequest",
+            "Referer": "https://online.hartlepool.gov.uk/fillform/?iframe_id=fillform-frame-1&db_id=",
+        }
+        s = requests.session()
+        r = s.get(SESSION_URL)
+        r.raise_for_status()
+        session_data = r.json()
+        sid = session_data["auth-session"]
+        params = {
+            "id": "5ec67e019ffdd",
+            "repeat_against": "",
+            "noRetry": "true",
+            "getOnlyTokens": "undefined",
+            "log_id": "",
+            "app_name": "AF-Renderer::Self",
+            # unix timestamp in milliseconds
+            "_": str(int(time.time() * 1000)),
+            "sid": sid,
+        }
+
+        data = {
+            "formValues": {
+                "Section 1": {
+                    "collectionLocationUPRN": {
+                        "value": user_uprn,
+                    },
+                },
+            },
+        }
+
+        r = s.post(API_URL, json=data, headers=headers, params=params)
+        r.raise_for_status()
+
+        data = r.json()
+        rows_data = data["integration"]["transformed"]["rows_data"]["0"]
+        if not isinstance(rows_data, dict):
+            raise ValueError("Invalid data returned from API")
+
+        soup = BeautifulSoup(rows_data["HTMLCollectionDatesText"], "html.parser")
+
+        # Find all div elements containing the bin schedule
+        for div in soup.find_all("div"):
+            # Extract bin type and date from the span tag
+            text = div.find("span").text.strip()
+            bin_type, date = text.split(" ", 1)
+            dict_data = {
+                "type": bin_type,
+                "collectionDate": date,
+            }
+            bindata["bins"].append(dict_data)
+
+        return bindata
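This follows the AchieveForms "apibroker/runLookup" pattern used by several other council modules: fetch a session id from the isauthenticated endpoint, then POST the form values with that sid. A condensed sketch of just that handshake, assuming the endpoint tolerates dropping the extra headers and bookkeeping params the full scraper sends (the UPRN is a placeholder):

import time

import requests

SESSION_URL = (
    "https://online.hartlepool.gov.uk/authapi/isauthenticated"
    "?uri=https%253A%252F%252Fonline.hartlepool.gov.uk%252Fservice%252F"
    "Refuse_and_recycling___check_bin_day"
    "&hostname=online.hartlepool.gov.uk&withCredentials=true"
)
API_URL = "https://online.hartlepool.gov.uk/apibroker/runLookup"

s = requests.session()
# Step 1: the session id comes back in the "auth-session" field.
sid = s.get(SESSION_URL).json()["auth-session"]
# Step 2: run the lookup form with that sid; "012345678912" is a placeholder UPRN.
params = {"id": "5ec67e019ffdd", "_": str(int(time.time() * 1000)), "sid": sid}
payload = {
    "formValues": {
        "Section 1": {"collectionLocationUPRN": {"value": "012345678912"}}
    }
}
rows = s.post(API_URL, json=payload, params=params).json()
print(rows["integration"]["transformed"]["rows_data"]["0"])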
uk_bin_collection/uk_bin_collection/councils/KingsLynnandWestNorfolkBC.py (new file)
@@ -0,0 +1,59 @@
+import requests
+from bs4 import BeautifulSoup
+
+from uk_bin_collection.uk_bin_collection.common import *
+from uk_bin_collection.uk_bin_collection.get_bin_data import AbstractGetBinDataClass
+
+
+# import the wonderful Beautiful Soup and the URL grabber
+class CouncilClass(AbstractGetBinDataClass):
+    """
+    Concrete classes have to implement all abstract operations of the
+    base class. They can also override some operations with a default
+    implementation.
+    """
+
+    def parse_data(self, page: str, **kwargs) -> dict:
+
+        user_uprn = kwargs.get("uprn")
+        check_uprn(user_uprn)
+        user_uprn = user_uprn.zfill(12)
+        bindata = {"bins": []}
+
+        URI = "https://www.west-norfolk.gov.uk/info/20174/bins_and_recycling_collection_dates"
+
+        headers = {"Cookie": f"bcklwn_uprn={user_uprn}"}
+
+        # Make the GET request
+        response = requests.get(URI, headers=headers)
+
+        soup = BeautifulSoup(response.content, features="html.parser")
+        soup.prettify()
+
+        # Find all bin_date_container divs
+        bin_date_containers = soup.find_all("div", class_="bin_date_container")
+
+        # Loop through each bin_date_container
+        for container in bin_date_containers:
+            # Extract the collection date
+            date = (
+                container.find("h3", class_="collectiondate").text.strip().rstrip(":")
+            )
+
+            # Extract the bin type from the alt attribute of the img tag
+            bin_type = container.find("img")["alt"]
+
+            dict_data = {
+                "type": bin_type,
+                "collectionDate": datetime.strptime(
+                    date,
+                    "%A %d %B %Y",
+                ).strftime("%d/%m/%Y"),
+            }
+            bindata["bins"].append(dict_data)
+
+        bindata["bins"].sort(
+            key=lambda x: datetime.strptime(x.get("collectionDate"), "%d/%m/%Y")
+        )
+
+        return bindata
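The whole lookup rides on a single "bcklwn_uprn" cookie; no form submission is needed. The hand-built Cookie header above can equally be expressed through requests' cookies parameter, which emits the same header. A sketch with a placeholder UPRN:

import requests

URI = "https://www.west-norfolk.gov.uk/info/20174/bins_and_recycling_collection_dates"
# Placeholder UPRN, zero-padded to 12 digits as the scraper does.
response = requests.get(URI, cookies={"bcklwn_uprn": "12345678".zfill(12)})
print(response.status_code)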
uk_bin_collection/uk_bin_collection/councils/LondonBoroughHavering.py (new file)
@@ -0,0 +1,75 @@
+import time
+
+import requests
+from bs4 import BeautifulSoup
+
+from uk_bin_collection.uk_bin_collection.common import *
+from uk_bin_collection.uk_bin_collection.get_bin_data import AbstractGetBinDataClass
+
+
+# import the wonderful Beautiful Soup and the URL grabber
+class CouncilClass(AbstractGetBinDataClass):
+    """
+    Concrete classes have to implement all abstract operations of the
+    base class. They can also override some operations with a default
+    implementation.
+    """
+
+    def parse_data(self, page: str, **kwargs) -> dict:
+
+        user_uprn = kwargs.get("uprn")
+        check_uprn(user_uprn)
+        bindata = {"bins": []}
+
+        URI = "https://lbhapiprod.azure-api.net"
+        endpoint = f"{URI}/whitespace/GetCollectionByUprnAndDate"
+        subscription_key = "2ea6a75f9ea34bb58d299a0c9f84e72e"
+
+        # Get today's date in 'YYYY-MM-DD' format
+        collection_date = datetime.now().strftime("%Y-%m-%d")
+
+        # Define the request headers
+        headers = {
+            "Content-Type": "application/json",
+            "Ocp-Apim-Subscription-Key": subscription_key,
+        }
+
+        # Define the request body
+        data = {
+            "getCollectionByUprnAndDate": {
+                "getCollectionByUprnAndDateInput": {
+                    "uprn": user_uprn,
+                    "nextCollectionFromDate": collection_date,
+                }
+            }
+        }
+        # Make the POST request
+        response = requests.post(endpoint, headers=headers, data=json.dumps(data))
+        response.raise_for_status()  # Raise an exception for HTTP errors
+
+        # Parse the JSON response
+        response_data = response.json()
+
+        collections = (
+            response_data.get("getCollectionByUprnAndDateResponse", {})
+            .get("getCollectionByUprnAndDateResult", {})
+            .get("Collections", [])
+        )
+
+        for collection in collections:
+            bin_type = collection["service"]
+            collection_date = collection["date"]
+
+            dict_data = {
+                "type": bin_type,
+                "collectionDate": datetime.strptime(
+                    collection_date,
+                    "%d/%m/%Y %H:%M:%S",
+                ).strftime(date_format),
+            }
+            bindata["bins"].append(dict_data)
+        bindata["bins"].sort(
+            key=lambda x: datetime.strptime(x.get("collectionDate"), date_format)
+        )
+
+        return bindata
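The Havering endpoint nests its payload inside request-named envelopes, and dates arrive as "%d/%m/%Y %H:%M:%S". A self-contained sketch of the unwrap-and-reformat step, run against a made-up payload shaped like the response handled above (date_format is "%d/%m/%Y" in this package's common module):

from datetime import datetime

date_format = "%d/%m/%Y"  # as defined in the package's common module

# Made-up payload shaped like the response the code above unwraps.
response_data = {
    "getCollectionByUprnAndDateResponse": {
        "getCollectionByUprnAndDateResult": {
            "Collections": [
                {"service": "Domestic Refuse", "date": "02/01/2025 07:00:00"},
            ]
        }
    }
}

collections = (
    response_data.get("getCollectionByUprnAndDateResponse", {})
    .get("getCollectionByUprnAndDateResult", {})
    .get("Collections", [])
)
bins = [
    {
        "type": c["service"],
        "collectionDate": datetime.strptime(
            c["date"], "%d/%m/%Y %H:%M:%S"
        ).strftime(date_format),
    }
    for c in collections
]
print(bins)  # [{'type': 'Domestic Refuse', 'collectionDate': '02/01/2025'}]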
uk_bin_collection/uk_bin_collection/councils/LondonBoroughLewisham.py (new file)
@@ -0,0 +1,132 @@
+import time
+
+from bs4 import BeautifulSoup
+from selenium.webdriver.common.by import By
+from selenium.webdriver.support import expected_conditions as EC
+from selenium.webdriver.support.ui import Select, WebDriverWait
+
+from uk_bin_collection.uk_bin_collection.common import *
+from uk_bin_collection.uk_bin_collection.get_bin_data import AbstractGetBinDataClass
+
+
+# import the wonderful Beautiful Soup and the URL grabber
+class CouncilClass(AbstractGetBinDataClass):
+    """
+    Concrete classes have to implement all abstract operations of the
+    base class. They can also override some operations with a default
+    implementation.
+    """
+
+    def parse_data(self, page: str, **kwargs) -> dict:
+
+        user_uprn = kwargs.get("uprn")
+        user_postcode = kwargs.get("postcode")
+        web_driver = kwargs.get("web_driver")
+        headless = kwargs.get("headless")
+        check_uprn(user_uprn)
+        bindata = {"bins": []}
+
+        # Initialize the WebDriver (Chrome in this case)
+        driver = create_webdriver(
+            web_driver,
+            headless,
+            "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/114.0.0.0 Safari/537.36",
+            __name__,
+        )
+
+        # Step 1: Navigate to the form page
+        driver.get(
+            "https://lewisham.gov.uk/myservices/recycling-and-rubbish/your-bins/collection"
+        )
+
+        try:
+            cookie_accept_button = WebDriverWait(driver, 5).until(
+                EC.element_to_be_clickable(
+                    (By.ID, "CybotCookiebotDialogBodyLevelButtonLevelOptinAllowAll")
+                )
+            )
+            cookie_accept_button.click()
+        except Exception:
+            print("No cookie consent banner found or already dismissed.")
+
+        # Wait for the form to load
+        WebDriverWait(driver, 10).until(
+            EC.presence_of_element_located((By.CLASS_NAME, "address-finder"))
+        )
+
+        # Step 2: Locate the input field for the postcode
+        postcode_input = driver.find_element(By.CLASS_NAME, "js-address-finder-input")
+
+        # Enter the postcode
+        postcode_input.send_keys(user_postcode)
+        time.sleep(1)  # Optional: Wait for the UI to react
+
+        # Step 3: Click the "Find address" button
+        find_button = WebDriverWait(driver, 10).until(
+            EC.element_to_be_clickable(
+                (By.CLASS_NAME, "js-address-finder-step-address")
+            )
+        )
+        find_button.click()
+
+        # Wait for the address selector to appear and options to load
+        WebDriverWait(driver, 10).until(
+            lambda d: len(
+                d.find_element(By.ID, "address-selector").find_elements(
+                    By.TAG_NAME, "option"
+                )
+            )
+            > 1
+        )
+
+        # Locate the address dropdown
+        address_selector = driver.find_element(By.ID, "address-selector")
+
+        # Use Select class to interact with the dropdown
+        select = Select(address_selector)
+        if len(select.options) > 1:
+            select.select_by_value(user_uprn)
+        else:
+            print("No additional addresses available to select")
+
+        # Wait until the URL contains the expected substring
+        WebDriverWait(driver, 10).until(
+            EC.url_contains("/find-your-collection-day-result")
+        )
+
+        # Parse the HTML
+        soup = BeautifulSoup(driver.page_source, "html.parser")
+
+        # Extract the main container
+        collection_result = soup.find("div", class_="js-find-collection-result")
+
+        # Extract each collection type and its frequency/day
+        for strong_tag in collection_result.find_all("strong"):
+            bin_type = strong_tag.text.strip()  # e.g., "Food waste"
+            # Extract day from the sibling text
+            schedule_text = (
+                strong_tag.next_sibling.next_sibling.next_sibling.text.strip()
+                .split("on\n")[-1]
+                .replace("\n", "")
+                .replace("\t", "")
+            )
+            day = schedule_text.strip().split(".")[0]
+
+            # Extract the next collection date
+            if "Your next collection date is" in schedule_text:
+                start_index = schedule_text.index("Your next collection date is") + len(
+                    "Your next collection date is"
+                )
+                next_collection_date = (
+                    schedule_text[start_index:].strip().split("\n")[0].strip()
+                )
+            else:
+                next_collection_date = get_next_day_of_week(day, date_format)
+
+            dict_data = {
+                "type": bin_type,
+                "collectionDate": next_collection_date,
+            }
+            bindata["bins"].append(dict_data)
+
+        return bindata
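When the Lewisham result page only names a weekday, the scraper falls back to get_next_day_of_week from the package's common module. A plausible equivalent of that helper, shown purely to illustrate the fallback (the real implementation may differ, for instance in whether a same-day match counts as today):

from datetime import datetime, timedelta

DAYS = ["Monday", "Tuesday", "Wednesday", "Thursday", "Friday", "Saturday", "Sunday"]

def next_day_of_week(day_name: str, fmt: str = "%d/%m/%Y") -> str:
    # Hypothetical stand-in for common.get_next_day_of_week: days until the
    # next occurrence of day_name, with a same-day match counting as today.
    today = datetime.now()
    offset = (DAYS.index(day_name) - today.weekday()) % 7
    return (today + timedelta(days=offset)).strftime(fmt)

print(next_day_of_week("Friday"))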
uk_bin_collection/uk_bin_collection/councils/MidSuffolkDistrictCouncil.py (BaberghDistrictCouncil.py shows the same +3 −1 counts in the file list)
@@ -24,6 +24,7 @@ class CouncilClass(AbstractGetBinDataClass):
 
         collection_day = kwargs.get("paon")
         garden_collection_week = kwargs.get("postcode")
+        garden_collection_day = kwargs.get("uprn")
         bindata = {"bins": []}
 
         days_of_week = [
@@ -42,6 +43,7 @@ class CouncilClass(AbstractGetBinDataClass):
         recyclingstartDate = datetime(2024, 11, 4)
 
         offset_days = days_of_week.index(collection_day)
+        offset_days_garden = days_of_week.index(garden_collection_day)
         if garden_collection_week:
             garden_collection = garden_week.index(garden_collection_week)
 
@@ -155,7 +157,7 @@ class CouncilClass(AbstractGetBinDataClass):
 
         collection_date = (
             datetime.strptime(gardenDate, "%d/%m/%Y")
-            + timedelta(days=offset_days)
+            + timedelta(days=offset_days_garden)
         ).strftime("%d/%m/%Y")
 
         garden_holiday = next(
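This change decouples the garden-waste weekday from the refuse weekday: the "uprn" kwarg is overloaded to carry the garden collection day name, and its index into days_of_week becomes the offset applied to garden dates. A worked example of the arithmetic, with made-up values (the Monday anchor mirrors the recyclingstartDate in the surrounding code, which suggests the schedule dates are week-start dates):

from datetime import datetime, timedelta

days_of_week = [
    "Monday", "Tuesday", "Wednesday", "Thursday", "Friday", "Saturday", "Sunday",
]

collection_day = "Tuesday"          # "paon" kwarg: refuse/recycling day
garden_collection_day = "Thursday"  # "uprn" kwarg: garden waste day (new)

offset_days = days_of_week.index(collection_day)                # 1
offset_days_garden = days_of_week.index(garden_collection_day)  # 3

gardenDate = "04/11/2024"  # a Monday, made up for the example
collection_date = (
    datetime.strptime(gardenDate, "%d/%m/%Y") + timedelta(days=offset_days_garden)
).strftime("%d/%m/%Y")
print(collection_date)  # 07/11/2024, a Thursday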
uk_bin_collection/uk_bin_collection/councils/MorayCouncil.py (new file)
@@ -0,0 +1,65 @@
+import requests
+from bs4 import BeautifulSoup
+
+from uk_bin_collection.uk_bin_collection.common import *
+from uk_bin_collection.uk_bin_collection.get_bin_data import AbstractGetBinDataClass
+
+
+# import the wonderful Beautiful Soup and the URL grabber
+class CouncilClass(AbstractGetBinDataClass):
+    """
+    Concrete classes have to implement all abstract operations of the
+    base class. They can also override some operations with a default
+    implementation.
+    """
+
+    def parse_data(self, page: str, **kwargs) -> dict:
+
+        user_uprn = kwargs.get("uprn")
+        bindata = {"bins": []}
+
+        user_uprn = user_uprn.zfill(8)
+
+        year = datetime.today().year
+        response = requests.get(
+            f"https://bindayfinder.moray.gov.uk/cal_{year}_view.php",
+            params={"id": user_uprn},
+        )
+        if response.status_code != 200:
+            # fall back to known good calendar URL
+            response = requests.get(
+                "https://bindayfinder.moray.gov.uk/cal_2024_view.php",
+                params={"id": user_uprn},
+            )
+        soup = BeautifulSoup(response.text, "html.parser")
+
+        bin_types = {
+            "G": "Green",
+            "B": "Brown",
+            "P": "Purple",
+            "C": "Blue",
+            "O": "Orange",
+        }
+
+        for month_container in soup.findAll("div", class_="month-container"):
+            for div in month_container.findAll("div"):
+                if "month-header" in div["class"]:
+                    month = div.text
+                elif div["class"] and div["class"][0] in ["B", "GPOC", "GBPOC"]:
+                    bins = div["class"][0]
+                    dom = int(div.text)
+                    for i in bins:
+                        dict_data = {
+                            "type": bin_types.get(i),
+                            "collectionDate": datetime.strptime(
+                                f"{dom} {month} {year}",
+                                "%d %B %Y",
+                            ).strftime("%d/%m/%Y"),
+                        }
+                        bindata["bins"].append(dict_data)
+
+        bindata["bins"].sort(
+            key=lambda x: datetime.strptime(x.get("collectionDate"), "%d/%m/%Y")
+        )
+
+        return bindata
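On the Moray calendar, each day cell's CSS class concatenates one letter per bin colour collected that day, and the scraper only reacts to the combinations "B", "GPOC" and "GBPOC". Decoding is a per-character dictionary lookup; a self-contained restatement:

bin_types = {"G": "Green", "B": "Brown", "P": "Purple", "C": "Blue", "O": "Orange"}

def decode(class_string: str) -> list:
    # One letter per bin colour collected on that day.
    return [bin_types.get(letter) for letter in class_string]

print(decode("GPOC"))  # ['Green', 'Purple', 'Orange', 'Blue']
print(decode("B"))     # ['Brown']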
uk_bin_collection/uk_bin_collection/councils/NewcastleUnderLymeCouncil.py (new file)
@@ -0,0 +1,66 @@
+import requests
+from bs4 import BeautifulSoup
+from dateutil.relativedelta import relativedelta
+
+from uk_bin_collection.uk_bin_collection.common import *
+from uk_bin_collection.uk_bin_collection.get_bin_data import AbstractGetBinDataClass
+
+
+# import the wonderful Beautiful Soup and the URL grabber
+class CouncilClass(AbstractGetBinDataClass):
+    """
+    Concrete classes have to implement all abstract operations of the
+    base class. They can also override some operations with a default
+    implementation.
+    """
+
+    def parse_data(self, page: str, **kwargs) -> dict:
+
+        user_uprn = kwargs.get("uprn")
+        check_uprn(user_uprn)
+        bindata = {"bins": []}
+
+        URI = f"https://www.newcastle-staffs.gov.uk/homepage/97/check-your-bin-day?uprn={user_uprn}"
+
+        # Make the GET request
+        response = requests.get(URI)
+        response.raise_for_status()
+        soup = BeautifulSoup(response.text, features="html.parser")
+        soup.prettify()
+
+        # Find the table
+        table = soup.find("table", {"class": "data-table"})
+
+        if table:
+            rows = table.find("tbody").find_all("tr")
+            for row in rows:
+                date = datetime.strptime(
+                    (
+                        row.find_all("td")[0]
+                        .get_text(strip=True)
+                        .replace("Date:", "")
+                        .strip()
+                    ),
+                    "%A %d %B",
+                ).replace(year=datetime.now().year)
+                if datetime.now().month > 10 and date.month < 3:
+                    date = date + relativedelta(years=1)
+                bin_types = (
+                    row.find_all("td")[1]
+                    .text.replace("Collection Type:", "")
+                    .splitlines()
+                )
+                for bin_type in bin_types:
+                    bin_type = bin_type.strip()
+                    if bin_type:
+                        dict_data = {
+                            "type": bin_type.strip(),
+                            "collectionDate": date.strftime("%d/%m/%Y"),
+                        }
+                        bindata["bins"].append(dict_data)
+
+        bindata["bins"].sort(
+            key=lambda x: datetime.strptime(x.get("collectionDate"), "%d/%m/%Y")
+        )
+
+        return bindata
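The Newcastle-under-Lyme table omits the year ("%A %d %B"), so the code stamps on the current year and, when scraping in November or December, rolls January/February dates into the next year. The same logic isolated for clarity; the sample date is made up:

from datetime import datetime

from dateutil.relativedelta import relativedelta

def with_inferred_year(text: str, today: datetime) -> datetime:
    # The site omits the year, so parse the weekday/day/month and stamp on
    # the current year...
    date = datetime.strptime(text, "%A %d %B").replace(year=today.year)
    # ...then push early-year dates seen late in the year into next year.
    if today.month > 10 and date.month < 3:
        date = date + relativedelta(years=1)
    return date

print(with_inferred_year("Thursday 2 January", datetime(2024, 12, 20)))
# 2025-01-02 00:00:00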
uk_bin_collection/uk_bin_collection/councils/NorthHertfordshireDistrictCouncil.py (new file)
@@ -0,0 +1,93 @@
+import requests
+from bs4 import BeautifulSoup
+
+from uk_bin_collection.uk_bin_collection.common import *
+from uk_bin_collection.uk_bin_collection.get_bin_data import AbstractGetBinDataClass
+
+
+# import the wonderful Beautiful Soup and the URL grabber
+class CouncilClass(AbstractGetBinDataClass):
+    """
+    Concrete classes have to implement all abstract operations of the
+    base class. They can also override some operations with a default
+    implementation.
+    """
+
+    def parse_data(self, page: str, **kwargs) -> dict:
+
+        user_postcode = kwargs.get("postcode")
+        user_paon = kwargs.get("paon")
+        check_postcode(user_postcode)
+        check_paon(user_paon)
+        bindata = {"bins": []}
+
+        URI = "https://uhtn-wrp.whitespacews.com/"
+
+        session = requests.Session()
+
+        # get link from first page as has some kind of unique hash
+        r = session.get(
+            URI,
+        )
+        r.raise_for_status()
+        soup = BeautifulSoup(r.text, features="html.parser")
+
+        alink = soup.find("a", text="Find my bin collection day")
+
+        if alink is None:
+            raise Exception("Initial page did not load correctly")
+
+        # replace 'seq' query string to skip next step
+        nextpageurl = alink["href"].replace("seq=1", "seq=2")
+
+        data = {
+            "address_name_number": user_paon,
+            "address_postcode": user_postcode,
+        }
+
+        # get list of addresses
+        r = session.post(nextpageurl, data)
+        r.raise_for_status()
+
+        soup = BeautifulSoup(r.text, features="html.parser")
+
+        # get first address (if you don't enter enough argument values this won't find the right address)
+        alink = soup.find("div", id="property_list").find("a")
+
+        if alink is None:
+            raise Exception("Address not found")
+
+        nextpageurl = URI + alink["href"]
+
+        # get collection page
+        r = session.get(
+            nextpageurl,
+        )
+        r.raise_for_status()
+        soup = BeautifulSoup(r.text, features="html.parser")
+
+        if soup.find("span", id="waste-hint"):
+            raise Exception("No scheduled services at this address")
+
+        u1s = soup.find("section", id="scheduled-collections").find_all("u1")
+
+        for u1 in u1s:
+            lis = u1.find_all("li", recursive=False)
+
+            date = lis[1].text.replace("\n", "")
+            bin_type = lis[2].text.replace("\n", "")
+
+            dict_data = {
+                "type": bin_type,
+                "collectionDate": datetime.strptime(
+                    date,
+                    "%d/%m/%Y",
+                ).strftime(date_format),
+            }
+            bindata["bins"].append(dict_data)
+
+        bindata["bins"].sort(
+            key=lambda x: datetime.strptime(x.get("collectionDate"), date_format)
+        )
+
+        return bindata
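Note that the scraper searches for "u1" elements, not "ul", presumably matching the Whitespace portal's actual markup. An offline sketch against made-up HTML shaped to those selectors shows how the date and service are read from the second and third li of each entry:

from bs4 import BeautifulSoup

# Made-up markup matching the selectors the scraper uses, including the
# literal <u1> tag name it searches for.
html = """
<section id="scheduled-collections">
  <u1>
    <li>123 Example Street</li>
    <li>06/01/2025</li>
    <li>Domestic Waste Collection Service</li>
  </u1>
</section>
"""

soup = BeautifulSoup(html, "html.parser")
for u1 in soup.find("section", id="scheduled-collections").find_all("u1"):
    lis = u1.find_all("li", recursive=False)
    print(lis[1].text, "->", lis[2].text)
# 06/01/2025 -> Domestic Waste Collection Service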