TopDownHockey-Scraper 4.1.3__tar.gz → 4.2.0__tar.gz

This diff shows the changes between two publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Potentially problematic release.


This version of TopDownHockey-Scraper might be problematic. Click here for more details.

@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: TopDownHockey_Scraper
3
- Version: 4.1.3
3
+ Version: 4.2.0
4
4
  Summary: The TopDownHockey Scraper
5
5
  Home-page: https://github.com/TopDownHockey/TopDownHockey_Scraper
6
6
  Author: Patrick Bacon
@@ -1,6 +1,6 @@
1
1
  [metadata]
2
2
  name = TopDownHockey_Scraper
3
- version = 4.1.3
3
+ version = 4.2.0
4
4
  author = Patrick Bacon
5
5
  author_email = patrick.s.bacon@gmail.com
6
6
  description = A package built for scraping hockey data from EliteProspects, the NHL's HTML/API reports, and ESPN's XML reports.
@@ -9,7 +9,7 @@ with open("README.md", "r", encoding="utf-8") as fh:
9
9
 
10
10
  setup(
11
11
  name="TopDownHockey_Scraper", # Replace with your own username
12
- version="4.1.3",
12
+ version="4.2.0",
13
13
  author="Patrick Bacon",
14
14
  author_email="patrick.s.bacon@gmail.com",
15
15
  description="The TopDownHockey Scraper",
@@ -490,7 +490,19 @@ def scrape_html_roster(season, game_id):
490
490
  (np.where(roster_df['Name']== "NICHOLAS PAUL" , "NICK PAUL",
491
491
  (np.where(roster_df['Name']== "JACOB MIDDLETON" , "JAKE MIDDLETON",
492
492
  (np.where(roster_df['Name']== "TOMMY NOVAK" , "THOMAS NOVAK",
493
- roster_df['Name']))))))))
493
+ # New guys from 24-25
494
+ (np.where(roster_df['Name']== "JOSHUA NORRIS" , "JOSH NORRIS",
495
+ (np.where(roster_df['Name']== "P.O JOSEPH" , "PIERRE-OLIVIER JOSEPH",
496
+ (np.where(roster_df['Name']== "MIKEY EYSSIMONT" , "MICHAEL EYSSIMONT",
497
+ (np.where(roster_df['Name']== "MATAJ BLAMEL" , "MATAJ BLAMEL",
498
+ (np.where(roster_df['Name']== "VITTORIO MANCINI" , "VICTOR MANCINI",
499
+ (np.where(roster_df['Name']== "JOSHUA MAHURA" , "JOSH MAHURA",
500
+ (np.where(roster_df['Name']== "JOSEPH VELENO" , "JOE VELENO",
501
+ (np.where(roster_df['Name']== "ZACK BOLDUC" , "ZACHARY BOLDUC",
502
+ (np.where(roster_df['Name']== "JOSHUA BROWN" , "JOSH BROWN",
503
+ (np.where(roster_df['Name']== "JAKE LUCCHINI" , "JACOB LUCCHINI",
504
+ (np.where(roster_df['Name']== "EMIL LILLEBERG" , "EMIL MARTINSEN LILLEBERG",
505
+ roster_df['Name']))))))))))))))))))))))))))))))
494
506
 
495
507
  roster_df['Name'] = roster_df['Name'].str.normalize('NFKD').str.encode('ascii', errors='ignore').str.decode('utf-8').str.upper()
496
508
 
@@ -1190,6 +1202,24 @@ def scrape_html_shifts(season, game_id):
1190
1202
  (np.where(all_shifts['name']== "JOSH DUNNE" , "JOSHUA DUNNE",all_shifts['name'])))))))))))))))))))))))))))))))))))))))))))
1191
1203
  )))))))))))))))))))))))))))))))))))))
1192
1204
 
1205
+ all_shifts['name'] = (np.where(all_shifts['name']== "JANIS MOSER" , "J.J. MOSER",
1206
+ (np.where(all_shifts['name']== "NICHOLAS PAUL" , "NICK PAUL",
1207
+ (np.where(all_shifts['name']== "JACOB MIDDLETON" , "JAKE MIDDLETON",
1208
+ (np.where(all_shifts['name']== "TOMMY NOVAK" , "THOMAS NOVAK",
1209
+ # New guys from 24-25
1210
+ (np.where(all_shifts['name']== "JOSHUA NORRIS" , "JOSH NORRIS",
1211
+ (np.where(all_shifts['name']== "P.O JOSEPH" , "PIERRE-OLIVIER JOSEPH",
1212
+ (np.where(all_shifts['name']== "MIKEY EYSSIMONT" , "MICHAEL EYSSIMONT",
1213
+ (np.where(all_shifts['name']== "MATAJ BLAMEL" , "MATAJ BLAMEL",
1214
+ (np.where(all_shifts['name']== "VITTORIO MANCINI" , "VICTOR MANCINI",
1215
+ (np.where(all_shifts['name']== "JOSHUA MAHURA" , "JOSH MAHURA",
1216
+ (np.where(all_shifts['name']== "JOSEPH VELENO" , "JOE VELENO",
1217
+ (np.where(all_shifts['name']== "ZACK BOLDUC" , "ZACHARY BOLDUC",
1218
+ (np.where(all_shifts['name']== "JOSHUA BROWN" , "JOSH BROWN",
1219
+ (np.where(all_shifts['name']== "JAKE LUCCHINI" , "JACOB LUCCHINI",
1220
+ (np.where(all_shifts['name']== "EMIL LILLEBERG" , "EMIL MARTINSEN LILLEBERG",
1221
+ all_shifts['name']))))))))))))))))))))))))))))))
1222
+
1193
1223
  all_shifts['name'] = all_shifts['name'].str.normalize('NFKD').str.encode('ascii', errors='ignore').str.decode('utf-8').str.upper()
1194
1224
 
1195
1225
 
@@ -1492,6 +1522,25 @@ def scrape_api_events(game_id, drop_description = True, shift_to_espn = False):
1492
1522
  ))))))))))))))))))))))))))))))))))))))))))))))))))))))))))))
1493
1523
  )))))))))))))))))))))))))))))))))))))))))))))))
1494
1524
 
1525
+ api_events['ep1_name'] = (np.where(api_events['ep1_name']== "JANIS MOSER" , "J.J. MOSER",
1526
+ (np.where(api_events['ep1_name']== "NICHOLAS PAUL" , "NICK PAUL",
1527
+ (np.where(api_events['ep1_name']== "JACOB MIDDLETON" , "JAKE MIDDLETON",
1528
+ (np.where(api_events['ep1_name']== "TOMMY NOVAK" , "THOMAS NOVAK",
1529
+ # New guys from 24-25
1530
+ (np.where(api_events['ep1_name']== "JOSHUA NORRIS" , "JOSH NORRIS",
1531
+ (np.where(api_events['ep1_name']== "P.O JOSEPH" , "PIERRE-OLIVIER JOSEPH",
1532
+ (np.where(api_events['ep1_name']== "MIKEY EYSSIMONT" , "MICHAEL EYSSIMONT",
1533
+ (np.where(api_events['ep1_name']== "MATAJ BLAMEL" , "MATAJ BLAMEL",
1534
+ (np.where(api_events['ep1_name']== "VITTORIO MANCINI" , "VICTOR MANCINI",
1535
+ (np.where(api_events['ep1_name']== "JOSHUA MAHURA" , "JOSH MAHURA",
1536
+ (np.where(api_events['ep1_name']== "JOSEPH VELENO" , "JOE VELENO",
1537
+ (np.where(api_events['ep1_name']== "ZACK BOLDUC" , "ZACHARY BOLDUC",
1538
+ (np.where(api_events['ep1_name']== "JOSHUA BROWN" , "JOSH BROWN",
1539
+ (np.where(api_events['ep1_name']== "JAKE LUCCHINI" , "JACOB LUCCHINI",
1540
+ (np.where(api_events['ep1_name']== "EMIL LILLEBERG" , "EMIL MARTINSEN LILLEBERG",
1541
+ api_events['ep1_name']))))))))))))))))))))))))))))))
1542
+
1543
+
1495
1544
  # 21-22 CHANGES
1496
1545
 
1497
1546
  api_events['ep1_name'] = api_events['ep1_name'].str.normalize('NFKD').str.encode('ascii', errors='ignore').str.decode('utf-8').str.upper()
@@ -1852,11 +1901,29 @@ def scrape_espn_events(espn_game_id, drop_description = True):
1852
1901
  (np.where(espn_events['event_player_1']== "TOMMY NOVAK" , "THOMAS NOVAK",
1853
1902
  espn_events['event_player_1']))))))))
1854
1903
 
1855
- espn_events['event_player_1'] = (np.where(espn_events['event_player_1']== "PAT MAROON" , "PATRICK MAROON",
1856
- (np.where(espn_events['event_player_1']== "JOHHNY BEECHER" , "JOHN BEECHER",
1904
+ espn_events['event_player_1'] = (np.where(espn_events['event_player_1']== "JOHHNY BEECHER" , "JOHN BEECHER",
1857
1905
  (np.where(espn_events['event_player_1']== "ALEXANDER BARKOV" , "ALEKSANDER BARKOV",
1858
1906
  (np.where(espn_events['event_player_1']== "TOMMY NOVAK" , "THOMAS NOVAK",
1859
- espn_events['event_player_1']))))))))
1907
+ espn_events['event_player_1']))))))
1908
+
1909
+ espn_events['event_player_1'] = (np.where(espn_events['event_player_1']== "JANIS MOSER" , "J.J. MOSER",
1910
+ (np.where(espn_events['event_player_1']== "NICHOLAS PAUL" , "NICK PAUL",
1911
+ (np.where(espn_events['event_player_1']== "JACOB MIDDLETON" , "JAKE MIDDLETON",
1912
+ (np.where(espn_events['event_player_1']== "TOMMY NOVAK" , "THOMAS NOVAK",
1913
+ # New guys from 24-25
1914
+ (np.where(espn_events['event_player_1']== "JOSHUA NORRIS" , "JOSH NORRIS",
1915
+ (np.where(espn_events['event_player_1']== "P.O JOSEPH" , "PIERRE-OLIVIER JOSEPH",
1916
+ (np.where(espn_events['event_player_1']== "MIKEY EYSSIMONT" , "MICHAEL EYSSIMONT",
1917
+ (np.where(espn_events['event_player_1']== "MATAJ BLAMEL" , "MATAJ BLAMEL",
1918
+ (np.where(espn_events['event_player_1']== "VITTORIO MANCINI" , "VICTOR MANCINI",
1919
+ (np.where(espn_events['event_player_1']== "JOSHUA MAHURA" , "JOSH MAHURA",
1920
+ (np.where(espn_events['event_player_1']== "JOSEPH VELENO" , "JOE VELENO",
1921
+ (np.where(espn_events['event_player_1']== "ZACK BOLDUC" , "ZACHARY BOLDUC",
1922
+ (np.where(espn_events['event_player_1']== "JOSHUA BROWN" , "JOSH BROWN",
1923
+ (np.where(espn_events['event_player_1']== "JAKE LUCCHINI" , "JACOB LUCCHINI",
1924
+ (np.where(espn_events['event_player_1']== "EMIL LILLEBERG" , "EMIL MARTINSEN LILLEBERG",
1925
+ espn_events['event_player_1']))))))))))))))))))))))))))))))
1926
+
1860
1927
 
1861
1928
  espn_events = espn_events.assign(version =
1862
1929
  (np.where(
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: TopDownHockey_Scraper
3
- Version: 4.1.3
3
+ Version: 4.2.0
4
4
  Summary: The TopDownHockey Scraper
5
5
  Home-page: https://github.com/TopDownHockey/TopDownHockey_Scraper
6
6
  Author: Patrick Bacon