warn-scraper 1.2.76__py3-none-any.whl → 1.2.78__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
warn/scrapers/ca.py CHANGED
@@ -138,23 +138,24 @@ def _extract_excel_data(wb_path):
138
138
  # Loop through all the rows
139
139
  payload = []
140
140
  for row in rows:
141
- first_cell = row[0].value.strip().lower()
142
- # Exit if we've reached summary row at bottom
143
- if first_cell == "report summary":
144
- break
145
-
146
- data = {
147
- "county": row[0].value.strip(),
148
- "notice_date": _convert_date(row[1].value),
149
- "received_date": _convert_date(row[2].value),
150
- "effective_date": _convert_date(row[3].value),
151
- "company": row[4].value.strip(),
152
- "layoff_or_closure": row[5].value.strip(),
153
- "num_employees": row[num_employees_index].value,
154
- "address": row[address_index].value.strip(),
155
- "source_file": str(wb_path).split("/")[-1],
156
- }
157
- payload.append(data)
141
+ if row[0].value:
142
+ first_cell = row[0].value.strip().lower()
143
+ # Exit if we've reached summary row at bottom
144
+ if first_cell == "report summary":
145
+ break
146
+
147
+ data = {
148
+ "county": row[0].value.strip(),
149
+ "notice_date": _convert_date(row[1].value),
150
+ "received_date": _convert_date(row[2].value),
151
+ "effective_date": _convert_date(row[3].value),
152
+ "company": row[4].value.strip(),
153
+ "layoff_or_closure": row[5].value.strip(),
154
+ "num_employees": row[num_employees_index].value,
155
+ "address": row[address_index].value.strip(),
156
+ "source_file": str(wb_path).split("/")[-1],
157
+ }
158
+ payload.append(data)
158
159
  return payload
159
160
 
160
161
 
warn/scrapers/id.py CHANGED
@@ -53,7 +53,7 @@ def scrape(
53
53
  # Start finding the link before "Who to contact"
54
54
  html = r.text
55
55
  localizedhtml = html.split("<h2>Who to contact")[0]
56
- soup = BeautifulSoup(localizedhtml, features="lxml")
56
+ soup = BeautifulSoup(localizedhtml, features="html5lib")
57
57
  last_url = soup.find_all("a")[-1]["href"]
58
58
  pdf_url = f"{base_url}{last_url}"
59
59
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: warn-scraper
3
- Version: 1.2.76
3
+ Version: 1.2.78
4
4
  Summary: Command-line interface for downloading WARN Act notices of qualified plant closings and mass layoffs from state government websites
5
5
  Home-page: https://github.com/biglocalnews/warn-scraper
6
6
  Author: Big Local News
@@ -28,7 +28,7 @@ warn/scrapers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
28
28
  warn/scrapers/ak.py,sha256=h7BYMTV0whwWAPhbzVDVKMMoVCFphKly70aiTHabPq4,1847
29
29
  warn/scrapers/al.py,sha256=D0rT9GQ0vwfkRuveVAt-Po-T6b2TI1EPGeLOBy2m3_M,2240
30
30
  warn/scrapers/az.py,sha256=elGbue01Gjf_DQ66Wy9qqGIOJsiY-KIKJOVeft8pCXg,1447
31
- warn/scrapers/ca.py,sha256=rBTB-6LmNIlbGCqrCtI3O-w2e_0kcVSFxvjvh4EHBlk,8511
31
+ warn/scrapers/ca.py,sha256=VQOfjHXPCc-jYwh-EPGVVfnzvXB7pdmCt2uJ6QnMPRM,8600
32
32
  warn/scrapers/co.py,sha256=g076Zqe8XA8tbW03HP6-03mJV8fft1niHfa5Sy6me9A,7388
33
33
  warn/scrapers/ct.py,sha256=HLMmBSFhT5Y3vZQUwRyCTxiG5BMQXTfG3SEj5rkQEL4,4771
34
34
  warn/scrapers/dc.py,sha256=_sHLnVqK_W90QqJb_W88yDlgPjoMl63LYZP3CJfdN9g,4484
@@ -37,7 +37,7 @@ warn/scrapers/fl.py,sha256=YJ6Qt-jJZ7_iUKlHDaQuaV2gRmae8AJKS5dwwChadBE,9563
37
37
  warn/scrapers/ga.py,sha256=iuvXoP5nPEnjm8wiEWhtBwLnkdmElhJILin3No5HIyo,7412
38
38
  warn/scrapers/hi.py,sha256=pSplAP15_ZBfQtcywyErmvNcrk7u55TjZj_F0Nqw9L8,5660
39
39
  warn/scrapers/ia.py,sha256=zOncaA9M0d6paT4pB7UU_4D_yxUgeUiGRcnpKi9DsRA,1999
40
- warn/scrapers/id.py,sha256=rJBoJGpREP72ovZnxeulkdX_umEi4aEbcZUW3v0VqlA,5853
40
+ warn/scrapers/id.py,sha256=FldJHv8sqBVKIdq7YlOK_O3Uh2Xj9i0WL7wQgszBgTA,5857
41
41
  warn/scrapers/il.py,sha256=sygdvsNuB_Gvu3o_HidtpSP4FLz0szKb1zEHqGxVtlI,1563
42
42
  warn/scrapers/in.py,sha256=dAT40ROhhKiwLcwa_YJ6EyhsYBLe0IX2rOWXmNa6JMs,2026
43
43
  warn/scrapers/ks.py,sha256=F_3biEMF7zgCX2XVuUACR74Vyzapta4SaM9SY3EuZCU,1266
@@ -65,9 +65,9 @@ warn/scrapers/va.py,sha256=13lhkQrSkPGHEiWUuf1qiS890PWYE5gV-TgISpoiQnc,1711
65
65
  warn/scrapers/vt.py,sha256=d-bo4WK2hkrk4BhCCmLpEovcoZltlvdIUB6O0uaMx5A,1186
66
66
  warn/scrapers/wa.py,sha256=UXdVtHZo_a-XfoiyOooTRfTb9W3PErSZdKca6SRORgs,4282
67
67
  warn/scrapers/wi.py,sha256=ClEzXkwZbop0W4fkQgsb5oHAPUrb4luUPGV-jOKwkcg,4855
68
- warn_scraper-1.2.76.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
69
- warn_scraper-1.2.76.dist-info/METADATA,sha256=Adb8KydFcC46yyPoAb06yPV33sEgYxMiQRmx6Z2k9jA,2025
70
- warn_scraper-1.2.76.dist-info/WHEEL,sha256=GJ7t_kWBFywbagK5eo9IoUwLW6oyOeTKmQ-9iHFVNxQ,92
71
- warn_scraper-1.2.76.dist-info/entry_points.txt,sha256=poh_oSweObGlBSs1_2qZmnTodlOYD0KfO7-h7W2UQIw,47
72
- warn_scraper-1.2.76.dist-info/top_level.txt,sha256=gOhHgNEkrUvajlzoKkVOo-TlQht9MoXnKOErjzqLGHo,11
73
- warn_scraper-1.2.76.dist-info/RECORD,,
68
+ warn_scraper-1.2.78.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
69
+ warn_scraper-1.2.78.dist-info/METADATA,sha256=6GsM9rlqqDjF5QQ5eVR_MJXNH8JJd3lji3jFbDeudYc,2025
70
+ warn_scraper-1.2.78.dist-info/WHEEL,sha256=GJ7t_kWBFywbagK5eo9IoUwLW6oyOeTKmQ-9iHFVNxQ,92
71
+ warn_scraper-1.2.78.dist-info/entry_points.txt,sha256=poh_oSweObGlBSs1_2qZmnTodlOYD0KfO7-h7W2UQIw,47
72
+ warn_scraper-1.2.78.dist-info/top_level.txt,sha256=gOhHgNEkrUvajlzoKkVOo-TlQht9MoXnKOErjzqLGHo,11
73
+ warn_scraper-1.2.78.dist-info/RECORD,,