mampfes · 5ila5 · Dec 18, 2024 · Dec 11, 2024 · Dec 18, 2024 · Dec 18, 2024
diff --git a/custom_components/waste_collection_schedule/waste_collection_schedule/source/poznan_pl.py b/custom_components/waste_collection_schedule/waste_collection_schedule/source/poznan_pl.py
@@ -1,6 +1,5 @@
 import datetime
 import logging
-import re
 
 import requests
 from bs4 import BeautifulSoup, Tag
@@ -22,13 +21,13 @@
 API_URL = "https://www.poznan.pl/mim/odpady/harmonogramy.html"
 
 ICON_MAP = {
-    1: "mdi:trash-can",
-    2: "mdi:recycle",
-    3: "mdi:recycle",
-    4: "mdi:recycle",
-    5: "mdi:recycle",
-    6: "mdi:recycle",
-    7: "mdi:trash-can",
+    "Odpady zmieszane": "mdi:trash-can",
+    "Papier": "mdi:newspaper-variant-outline",
+    "Metale i tworzywa sztuczne": "mdi:bottle-soda-classic-outline",
+    "Szkło": "mdi:glass-fragile",
+    "Bioodpady": "mdi:recycle",
+    "Odpady wystawkowe": "mdi:cupboard",
+    "Drzewka świąteczne": "mdi:pine-tree",
 }
 
 
@@ -48,34 +47,33 @@ def fetch(self) -> list[Collection]:
         r = requests.post(f"{API_URL}", data)
         r.raise_for_status()
 
-        # Fix their broken html table
-        fixed_text = re.sub(r"</td>\s*<tr>\s*<tr>\s*<td", "</td></tr><tr><td", r.text)
-        fixed_text = re.sub(
-            r"</th>\s*<tr>\s*<tr>\s*<td", "</td></tr><tr><td", fixed_text
-        )
+        soup = BeautifulSoup(r.text, "html.parser")
 
-        soup = BeautifulSoup(fixed_text, "html.parser")
+        year = datetime.date.today().year
+        month = datetime.date.today().month
 
-        table = soup.find("table")
+        table = soup.find("table", id="schedule_0")
         if not isinstance(table, Tag):
             raise Exception("Invalid address")
 
         year = datetime.date.today().year
+        month = datetime.date.today().month
+        formatted_date = f"{month}.{year}"
 
         # find all non empty tr's
         trs = [
             tr for tr in table.find_all("tr") if isinstance(tr, Tag) and tr.find_all()
         ]
         entries = []
-        name_map = [th.text.strip() for th in table.find_all("th")]
 
-        for row_index, row in enumerate(trs):
-            if row_index == 0 or row_index > 12:
-                continue
-            for cell_index, cell in enumerate(row.find_all("td")):
+        for row in trs[1:]:  # Skipping first row since it is a header
+            all_cells = row.find_all("td")
+            collection_name = all_cells[0].text.strip()
+            # iterate over all rows with dates without collection name
+            for cell in all_cells[1:]:
                 if (
-                    cell_index == 0
-                    or not isinstance(cell, Tag)
+                    not isinstance(cell, Tag)
+                    or not cell["data-value"] == formatted_date
                     or not cell.text.strip()
                 ):
                     continue
@@ -84,9 +82,9 @@ def fetch(self) -> list[Collection]:
                     day = day.strip()
                     entries.append(
                         Collection(
-                            datetime.date(year, row_index, int(day)),
-                            name_map[cell_index],
-                            ICON_MAP[cell_index],
+                            datetime.date(year, month, int(day)),
+                            collection_name,
+                            ICON_MAP.get(collection_name, "mdi:recycle"),
                         )
                     )