PyPI - pybaseballstats - Versions diffs - 0.0.1__tar.gz - Mend

pybaseballstats 0.0.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14) hide show

pybaseballstats-0.0.1/PKG-INFO +27 -0
pybaseballstats-0.0.1/README.md +11 -0
pybaseballstats-0.0.1/pybaseballstats/__init__.py +4 -0
pybaseballstats-0.0.1/pybaseballstats/fangraphs.py +214 -0
pybaseballstats-0.0.1/pybaseballstats/statcast.py +76 -0
pybaseballstats-0.0.1/pybaseballstats/statcast_utils.py +178 -0
pybaseballstats-0.0.1/pybaseballstats.egg-info/PKG-INFO +27 -0
pybaseballstats-0.0.1/pybaseballstats.egg-info/SOURCES.txt +12 -0
pybaseballstats-0.0.1/pybaseballstats.egg-info/dependency_links.txt +1 -0
pybaseballstats-0.0.1/pybaseballstats.egg-info/requires.txt +9 -0
pybaseballstats-0.0.1/pybaseballstats.egg-info/top_level.txt +1 -0
pybaseballstats-0.0.1/pyproject.toml +17 -0
pybaseballstats-0.0.1/setup.cfg +4 -0
pybaseballstats-0.0.1/setup.py +8 -0

pybaseballstats-0.0.1/PKG-INFO ADDED Viewed

@@ -0,0 +1,27 @@
+Metadata-Version: 2.2
+Name: pybaseballstats
+Version: 0.0.1
+Summary: A Python package for scraping baseball data.
+Requires-Python: >=3.13
+Description-Content-Type: text/markdown
+Requires-Dist: aiohttp>=3.11.11
+Requires-Dist: asyncio>=3.4.3
+Requires-Dist: bs4>=0.0.2
+Requires-Dist: pandas>=2.2.3
+Requires-Dist: polars>=1.20.0
+Requires-Dist: pytest>=8.3.4
+Requires-Dist: ruff>=0.9.3
+Requires-Dist: setuptools>=75.8.0
+Requires-Dist: tqdm>=4.67.1
+# pybaseballstats
+A Python package for scraping baseball statistics from the web. Inspired by the pybaseball package by James LeDoux. This package is a work in progress and is not yet ready for use.
+## Available Sources
+1. Baseball Savant
+## Usage
+Usage documentation can be found at /usage_docs/

pybaseballstats-0.0.1/README.md ADDED Viewed

@@ -0,0 +1,11 @@
+# pybaseballstats
+A Python package for scraping baseball statistics from the web. Inspired by the pybaseball package by James LeDoux. This package is a work in progress and is not yet ready for use.
+## Available Sources
+1. Baseball Savant
+## Usage
+Usage documentation can be found at /usage_docs/

pybaseballstats-0.0.1/pybaseballstats/__init__.py ADDED Viewed

@@ -0,0 +1,4 @@
+from .fangraphs import (  # noqa: F401
+    show_fangraphs_batting_stat_types,
+)
+from .statcast import statcast_date_range, statcast_single_game  # noqa: F401

pybaseballstats-0.0.1/pybaseballstats/fangraphs.py ADDED Viewed

@@ -0,0 +1,214 @@
+from enum import Enum
+from typing import List
+import pandas as pd
+import polars as pl
+import requests
+from bs4 import BeautifulSoup
+url = "https://www.fangraphs.com/leaders/major-league?pos={pos}&stats=bat&lg={league}&qual={qual}&type={stat_type}&season={end_season}&season1={start_season}&ind=0&startdate={start_date}&enddate={end_date}&month=0&team=0&pagenum=1&pageitems=2000000000"
+# Accepted values for the query parameters in `url`:
+#   pos: c, 1b, 2b, 3b, ss, lf, cf, rf, dh, of, p, all
+#   qual: y, n
+#   lg (league): "", "al", "nl"
+#   startdate / enddate: strings in the format "yyyy-mm-dd"
+#   type (stat_type): 8 (dashboard), 0 (standard), 1 (advanced), 2 (batted ball), 3 (win_probability), 6 (value), 23 (+stats), 24 (statcast), 48 (violations)
+# Define the available stat types as an Enum
+class FangraphsBattingStatType(Enum):
+    """Fangraphs batting leaderboard stat groups.
+    Each member's value is the number substituted for the `type` query
+    parameter (the `{stat_type}` placeholder) in the leaderboard `url`.
+    """
+    DASHBOARD = 8
+    STANDARD = 0
+    ADVANCED = 1
+    BATTED_BALL = 2
+    WIN_PROBABILITY = 3
+    VALUE = 6
+    PLUS_STATS = 23
+    STATCAST = 24
+    VIOLATIONS = 48
+def get_table_data(
+    stat_type, pos, league, start_date, end_date, qual, start_season, end_season
+):
+    # Assuming `cont` contains the HTML content
+    cont = requests.get(
+        url.format(
+            pos="all",
+            league="",
+            stat_type=stat_type,
+            start_season=1900,
+            end_season=2024,
+            qual="y",
+            start_date="",
+            end_date="",
+        )
+    ).content.decode("utf-8")
+    # Parse the HTML content with BeautifulSoup
+    soup = BeautifulSoup(cont, "html.parser")
+    # Find the main table using the provided CSS selector
+    main_table = soup.select_one(
+        "#content > div.leaders-major_leaders-major__table__hcmbm > div.fg-data-grid.table-type > div.table-wrapper-outer > div > div.table-scroll > table"
+    )
+    # Find the table header
+    thead = main_table.find("thead")
+    # Extract column names from the data-col-id attribute of the <th> elements, excluding "divider"
+    headers = [
+        th["data-col-id"]
+        for th in thead.find_all("th")
+        if "data-col-id" in th.attrs and th["data-col-id"] != "divider"
+    ]
+    # Find the table body within the main table
+    tbody = main_table.find("tbody")
+    # Initialize a list to store the extracted data
+    data = []
+    # Iterate over each row in the table body
+    for row in tbody.find_all("tr"):
+        row_data = {header: None for header in headers}  # Initialize with None
+        for cell in row.find_all("td"):
+            col_id = cell.get("data-col-id")
+            if col_id and col_id != "divider":
+                if cell.find("a"):
+                    row_data[col_id] = cell.find("a").text
+                elif cell.find("span"):
+                    row_data[col_id] = cell.find("span").text
+                else:
+                    text = cell.text.strip().replace("%", "")
+                    if text == "":
+                        row_data[col_id] = None
+                    else:
+                        try:
+                            row_data[col_id] = float(text) if "." in text else int(text)
+                        except ValueError:
+                            row_data[col_id] = text
+        # Print row_data for debugging
+        data.append(row_data)
+    # Create a Polars DataFrame from the extracted data
+    df = pl.DataFrame(data)
+    return df
+def show_fangraphs_batting_stat_types():
+    for stat_type in FangraphsBattingStatType:
+        print(stat_type)
+def show_batting_pos_options():
+    print("c,1b,2b,3b,ss,lf,cf,rf,dh,of,p,all")
+def fangraphs_batting_date_range(
+    start_date: str,
+    end_date: str,
+    stat_types: List[FangraphsBattingStatType] = None,
+    return_pandas: bool = False,
+    pos: str = "all",
+    league: str = "",
+    qual: str = "y",
+) -> pl.DataFrame | pd.DataFrame:
+    """Pulls Fangraphs batting data for a date range.
+    Args:
+        start_date (str): format "yyyy-mm-dd", ex) "2021-04-01"
+        end_date (str): format "yyyy-mm-dd", ex) "2021-04-01"
+        stat_types (List[FangraphsBattingStatType], optional): List of what Fangraphs stat types to include, more information can be found by calling pyb.show_fangraphs_stat_types(). Defaults to None, meaning all stat types will be returned.
+        return_pandas (bool, optional): whether to return a Polars Dataframe (False) or a Pandas Dataframe (True). Defaults to False.
+        pos (str, optional): What positions to return data for. More information can be found by calling pyb.show_batting_pos_options(). Defaults to "all".
+        league (str, optional): What league to return data for, options are ""(all), "nl", "al". Defaults to "".
+        qual (str, optional): whether or not to restrict to qualified batters, to return unqualified batters pass "n" as the argument. Defaults to "y".
+    Returns:
+        pl.DataFrame | pd.DataFrame: The requested data as a Polars or Pandas DataFrame.
+    """
+    df_list = []
+    if stat_types is None:
+        stat_types = FangraphsBattingStatType
+    if len(stat_types) == 0:
+        print(
+            "Warning: No stat types provided, returning None, to return all stattypes, pass in None."
+        )
+        return None
+    for stat_type in stat_types:
+        print(f"Fetching data for {stat_type}...")
+        df = get_table_data(
+            stat_type=stat_types[stat_type.value],
+            pos=pos,
+            league=league,
+            start_date=start_date,
+            end_date=end_date,
+            qual=qual,
+            start_season="",
+            end_season="",
+        )
+        if df is not None:
+            print(f"Data fetched for {stat_type}")
+            df_list.append(df)
+        else:
+            print(f"Warning: No data returned for {stat_type}")
+    df = pl.concat(df_list, how="diagonal")
+    df = df.select(pl.col("Name").drop_nulls())
+    return df.to_pandas() if return_pandas else df
+def fangraphs_batting_season_range(
+    start_season,
+    end_season,
+    stat_types,
+    return_pandas=False,
+    pos="all",
+    league="",
+    qual="y",
+) -> pl.DataFrame | pd.DataFrame:
+    df_list = []
+    if stat_types is None:
+        stat_types = FangraphsBattingStatType
+    if len(stat_types) == 0:
+        print(
+            "Warning: No stat types provided, returning None, to return all stattypes, pass in None."
+        )
+        return None
+    for stat_type in stat_types:
+        print(f"Fetching data for {stat_type}...")
+        df = get_table_data(
+            stat_type=stat_types[stat_type.value],
+            pos=pos,
+            league=league,
+            start_date="",
+            end_date="",
+            qual=qual,
+            start_season=start_season,
+            end_season=end_season,
+        )
+        if df is not None:
+            print(f"Data fetched for {stat_type}")
+            df_list.append(df)
+        else:
+            print(f"Warning: No data returned for {stat_type}")
+    df = pl.concat(df_list, how="diagonal")
+    df = df.select(pl.col("Name").drop_nulls())
+    return df.to_pandas() if return_pandas else df
+def fangraphs_pitching_date_range():
+    """Placeholder: prints a "not implemented" notice and returns None."""
+    print("Not implemented yet.")
+def fangraphs_pitching_season_range():
+    """Placeholder: prints a "not implemented" notice and returns None."""
+    print("Not implemented yet.")
+def fangraphs_fielding_date_range():
+    """Placeholder: prints a "not implemented" notice and returns None."""
+    print("Not implemented yet.")
+def fangraphs_fielding_season_range():
+    """Placeholder: prints a "not implemented" notice and returns None."""
+    print("Not implemented yet.")

pybaseballstats-0.0.1/pybaseballstats/statcast.py ADDED Viewed

@@ -0,0 +1,76 @@
+import asyncio
+import io
+import logging as logger
+import pandas as pd
+import polars as pl
+import requests
+from .statcast_utils import (
+    ROOT_URL,
+    SINGLE_GAME,
+    _add_extra_stats,
+    _statcast_date_range_helper,
+)
+def statcast_single_game(
+    game_pk: int, extra_stats: bool, return_pandas: bool = False
+) -> pl.LazyFrame | pd.DataFrame:
+    """Pulls statcast data for a single game.
+    Args:
+        game_pk (int): game_pk of the game you want to pull data for
+        extra_stats (bool): whether or not to include extra stats
+        return_pandas (bool, optional): whether or not to return as a Pandas DataFrame. Defaults to False (returns Polars LazyFrame).
+    Returns:
+        pl.LazyFrame | pd.DataFrame: DataFrame of statcast data for the game
+    """
+    try:
+        statcast_content = requests.get(
+            ROOT_URL + SINGLE_GAME.format(game_pk=game_pk), timeout=None
+        ).content
+    except Exception as e:
+        logger.error(f"Failed to pull data for game_pk: {game_pk}. {str(e)}")
+        return pl.LazyFrame() if not return_pandas else pd.DataFrame()
+    if not extra_stats:
+        return (
+            pl.scan_csv(io.StringIO(statcast_content.decode("utf-8")))
+            if not return_pandas
+            else pd.read_csv(io.StringIO(statcast_content.decode("utf-8")))
+        )
+    else:
+        df = pl.scan_csv(io.StringIO(statcast_content.decode("utf-8")))
+        start_dt = df.select(pl.col("game_date").min())
+        end_dt = df.select(pl.col("game_date").max())
+        return asyncio.run(_add_extra_stats(df, start_dt, end_dt, return_pandas))
+def statcast_date_range(
+    start_dt: str,
+    end_dt: str,
+    team: str = None,
+    extra_stats: bool = False,
+    return_pandas: bool = False,
+) -> pl.LazyFrame | pd.DataFrame:
+    """
+    Pulls statcast data for a date range.
+    Args:
+    start_dt: the start date in 'YYYY-MM-DD' format
+    end_dt: the end date in 'YYYY-MM-DD' format
+    team: the team abbreviation (e.g. 'WSH'). If None, data for all teams will be returned.
+    extra_stats: whether to include extra stats
+    return_pandas: whether to return a pandas DataFrame (default is False, returning a Polars LazyFrame)
+    Returns:
+    A DataFrame of statcast data for the date range.
+    """
+    async def async_statcast():
+        return await _statcast_date_range_helper(
+            start_dt, end_dt, team, extra_stats, return_pandas
+        )
+    return asyncio.run(async_statcast())

pybaseballstats-0.0.1/pybaseballstats/statcast_utils.py ADDED Viewed

@@ -0,0 +1,178 @@
+import asyncio
+import datetime as dt
+from typing import Iterator, Tuple
+import aiohttp
+import pandas as pd
+import polars as pl
+from tqdm import tqdm
+from tqdm.asyncio import tqdm_asyncio
+# ROOT_URL, SINGLE_GAME and DATE_RANGE are adapted from pybaseball:
+# https://github.com/jldbc/pybaseball/blob/master/pybaseball/statcast.py
+ROOT_URL = "https://baseballsavant.mlb.com"
+SINGLE_GAME = "/statcast_search/csv?all=true&type=details&game_pk={game_pk}"
+DATE_RANGE = "/statcast_search/csv?all=true&hfPT=&hfAB=&hfBBT=&hfPR=&hfZ=&stadium=&hfBBL=&hfNewZones=&hfGT=R%7CPO%7CS%7C=&hfSea=&hfSit=&player_type=pitcher&hfOuts=&opponent=&pitcher_throws=&batter_stands=&hfSA=&game_date_gt={start_dt}&game_date_lt={end_dt}&team={team}&position=&hfRO=&home_road=&hfFlag=&metric_1=&hfInn=&min_pitches=0&min_results=0&group_by=name&sort_col=pitches&player_event_sort=h_launch_speed&sort_order=desc&min_abs=0&type=details&"
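+# EXTRA_STATS is this package's own search URL (not taken from pybaseball): per-player stats grouped by name for the given player_type.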
+EXTRA_STATS = "/statcast_search/csv?hfPT=&hfAB=&hfGT=R%7C&hfPR=&hfZ=&hfStadium=&hfBBL=&hfNewZones=&hfPull=&hfC=&hfSea=2024%7C2023%7C2022%7C2021%7C2020%7C2019%7C2018%7C2017%7C2016%7C2015%7C2014%7C2013%7C2012%7C2011%7C2010%7C2009%7C2008%7C&hfSit=&player_type={pos}&game_date_gt=&game_date_lt=&hfOuts=&hfOpponent=&pitcher_throws=&batter_stands=&hfSA=&hfMo=&hfTeam=&home_road=&hfRO=&position=&hfInfield=&hfOutfield=&hfInn=&hfBBT=&hfFlag=is%5C.%5C.remove%5C.%5C.bunts%7Cis%5C.%5C.competitive%7C&metric_1=&group_by=name&min_pitches=0&min_results=0&min_pas=0&sort_col=pitches&player_event_sort=api_p_release_speed&sort_order=desc&chk_stats_pa=on&chk_stats_abs=on&chk_stats_bip=on&chk_stats_hits=on&chk_stats_singles=on&chk_stats_dbls=on&chk_stats_triples=on&chk_stats_hrs=on&chk_stats_so=on&chk_stats_k_percent=on&chk_stats_bb=on&chk_stats_bb_percent=on&chk_stats_whiffs=on&chk_stats_swings=on&chk_stats_api_break_z_with_gravity=on&chk_stats_api_break_x_arm=on&chk_stats_api_break_z_induced=on&chk_stats_api_break_x_batter_in=on&chk_stats_ba=on&chk_stats_xba=on&chk_stats_xbadiff=on&chk_stats_obp=on&chk_stats_xobp=on&chk_stats_xobpdiff=on&chk_stats_slg=on&chk_stats_xslg=on&chk_stats_xslgdiff=on&chk_stats_woba=on&chk_stats_xwoba=on&chk_stats_wobadiff=on&chk_stats_barrels_total=on&chk_stats_babip=on&chk_stats_iso=on&chk_stats_run_exp=on&chk_stats_pitcher_run_exp=on&chk_stats_swing_miss_percent=on&chk_stats_batter_run_value_per_100=on&chk_stats_pitcher_run_value_per_100=on&chk_stats_velocity=on&chk_stats_effective_speed=on&chk_stats_spin_rate=on&chk_stats_release_pos_z=on&chk_stats_release_pos_x=on&chk_stats_release_extension=on&chk_stats_plate_x=on&chk_stats_plate_z=on&chk_stats_arm_angle=on&chk_stats_launch_speed=on&chk_stats_hyper_speed=on&chk_stats_sweetspot_speed_mph=on&chk_stats_launch_angle=on&chk_stats_bbdist=on&chk_stats_swing_length=on&chk_stats_hardhit_percent=on&chk_stats_barrels_per_bbe_percent=on&chk_stats_barrels_per_pa_percent=on&chk_stats_pos3_int_start_distance=on&chk_stats
_pos4_int_start_distance=on&chk_stats_pos5_int_start_distance=on&chk_stats_pos6_int_start_distance=on&chk_stats_pos7_int_start_distance=on&chk_stats_pos8_int_start_distance=on&chk_stats_pos9_int_start_distance=on#results"
+# Maps a season year to its (first date, last date). _create_date_ranges uses
+# these bounds to skip dates outside a season; years missing from this table
+# fall back to March 15 - November 15 there.
+# NOTE(review): several entries share a March 15 start date - confirm they are
+# real season bounds rather than placeholders.
+YEAR_RANGES = {
+    2022: (dt.date(2022, 3, 17), dt.date(2022, 11, 5)),
+    2016: (dt.date(2016, 4, 3), dt.date(2016, 11, 2)),
+    2019: (dt.date(2019, 3, 20), dt.date(2019, 10, 30)),
+    2017: (dt.date(2017, 4, 2), dt.date(2017, 11, 1)),
+    2023: (dt.date(2023, 3, 15), dt.date(2023, 11, 1)),
+    2020: (dt.date(2020, 7, 23), dt.date(2020, 10, 27)),
+    2018: (dt.date(2018, 3, 29), dt.date(2018, 10, 28)),
+    2015: (dt.date(2015, 4, 5), dt.date(2015, 11, 1)),
+    2024: (dt.date(2024, 3, 15), dt.date(2024, 10, 25)),
+    2021: (dt.date(2021, 3, 15), dt.date(2021, 11, 2)),
+}
+# strptime format used by _handle_dates to parse 'YYYY-MM-DD' input strings.
+STATCAST_DATE_FORMAT = "%Y-%m-%d"
+async def _fetch_data(session, url, retries=2):
+    for attempt in range(retries):
+        try:
+            async with session.get(url) as response:
+                return await response.read()
+        except aiohttp.ClientPayloadError as e:
+            if attempt < retries - 1:
+                await asyncio.sleep(1)  # Wait before retrying
+                print(f"Retrying... {retries - attempt - 1} attempts left.")
+                continue
+            else:
+                print(f"Failed to fetch data from {url}.")
+                raise e
+async def _fetch_all_data(urls):
+    async with aiohttp.ClientSession() as session:
+        tasks = [_fetch_data(session, url) for url in urls]
+        return await tqdm_asyncio.gather(*tasks, desc="Fetching data")
+async def _statcast_date_range_helper(
+    start_dt: str,
+    end_dt: str,
+    team: str = None,
+    extra_stats: bool = False,
+    return_pandas: bool = False,
+) -> pl.LazyFrame | pd.DataFrame:
+    """
+    Pulls statcast data for a date range.
+    Args:
+    start_dt: the start date in 'YYYY-MM-DD' format
+    end_dt: the end date in 'YYYY-MM-DD' format
+    team: the team abbreviation (e.g. 'WSH'). If None, data for all teams will be returned.
+    Returns:
+    A DataFrame of statcast data for the date range.
+    """
+    if start_dt is None or end_dt is None:
+        raise ValueError("Both start_dt and end_dt must be provided.")
+    print(f"Pulling data for date range: {start_dt} to {end_dt}.")
+    start_dt, end_dt = _handle_dates(start_dt, end_dt)
+    date_ranges = list(_create_date_ranges(start_dt, end_dt, 1))
+    data_list = []
+    urls = [
+        ROOT_URL
+        + DATE_RANGE.format(
+            start_dt=str(start),
+            end_dt=str(end),
+            team=team if team else "",
+        )
+        for start, end in date_ranges
+    ]
+    schema = None
+    responses = await _fetch_all_data(urls)
+    for data in tqdm(responses, desc="Processing regular data"):
+        # scan csv as lazyframe and drop columns that will always be null
+        data = pl.scan_csv(data)
+        if schema is None:
+            schema = data.collect_schema()
+        else:
+            data = data.cast(schema)
+        data_list.append(data)
+    print("Concatenating data.")
+    df = pl.concat(data_list)
+    print("Data concatenated.")
+    if not extra_stats:
+        print("Done")
+        return df if not return_pandas else df.to_pandas()
+    else:
+        return await _add_extra_stats(df, start_dt, end_dt, return_pandas=return_pandas)
+async def _add_extra_stats(
+    df: pl.LazyFrame, start_dt: dt.date, end_dt: dt.date, return_pandas: bool = False
+) -> pl.LazyFrame | pd.DataFrame:
+    df_list = []
+    urls = [
+        ROOT_URL + EXTRA_STATS.format(pos=pos, start_dt=start_dt, end_dt=end_dt)
+        for pos in ["pitcher", "batter"]
+    ]
+    responses = await _fetch_all_data(urls)
+    for data in tqdm(responses, desc="Processing extra data"):
+        data = pl.scan_csv(data)
+        df_list.append(data)
+    p_df = df_list[0]
+    p_df = p_df.drop("player_name").rename(lambda x: f"{x}_pitcher")
+    b_df = df_list[1]
+    b_df = b_df.drop("player_name").rename(lambda x: f"{x}_batter")
+    print("Joining data.")
+    df = df.join(p_df, left_on="pitcher", right_on="player_id_pitcher", how="left")
+    df = df.join(b_df, left_on="batter", right_on="player_id_batter", how="left")
+    print("Done")
+    return df if not return_pandas else df.to_pandas()
+def _handle_dates(start_dt: str, end_dt: str) -> Tuple[dt.date, dt.date]:
+    """
+    Helper function to handle date inputs.
+    Args:
+    start_dt: the start date in 'YYYY-MM-DD' format
+    end_dt: the end date in 'YYYY-MM-DD' format
+    Returns:
+    A tuple of datetime.date objects for the start and end dates.
+    """
+    start_dt_date = dt.datetime.strptime(start_dt, STATCAST_DATE_FORMAT).date()
+    end_dt_date = dt.datetime.strptime(end_dt, STATCAST_DATE_FORMAT).date()
+    if start_dt_date > end_dt_date:
+        raise ValueError("start_dt must be before end_dt.")
+    return start_dt_date, end_dt_date
+# this function comes from https://github.com/jldbc/pybaseball/blob/master/pybaseball/statcast.py
+def _create_date_ranges(
+    start: dt.date, stop: dt.date, step: int, verbose: bool = True
+) -> Iterator[Tuple[dt.date, dt.date]]:
+    """
+    Iterate over dates. Skip the offseason dates. Returns a pair of dates for beginning and end of each segment.
+    Range is inclusive of the stop date.
+    If verbose is enabled, it will print a message if it skips offseason dates.
+    This version is Statcast specific, relying on skipping predefined dates from STATCAST_VALID_DATES.
+    """
+    low = start
+    while low <= stop:
+        date_span = low.replace(month=3, day=15), low.replace(month=11, day=15)
+        season_start, season_end = YEAR_RANGES.get(low.year, date_span)
+        if low < season_start:
+            low = season_start
+        elif low > season_end:
+            low, _ = YEAR_RANGES.get(
+                low.year + 1, (dt.date(month=3, day=15, year=low.year + 1), None)
+            )
+        if low > stop:
+            return
+        high = min(low + dt.timedelta(step - 1), stop)
+        yield low, high
+        low += dt.timedelta(days=step)

pybaseballstats-0.0.1/pybaseballstats.egg-info/PKG-INFO ADDED Viewed

@@ -0,0 +1,27 @@
+Metadata-Version: 2.2
+Name: pybaseballstats
+Version: 0.0.1
+Summary: A Python package for scraping baseball data.
+Requires-Python: >=3.13
+Description-Content-Type: text/markdown
+Requires-Dist: aiohttp>=3.11.11
+Requires-Dist: asyncio>=3.4.3
+Requires-Dist: bs4>=0.0.2
+Requires-Dist: pandas>=2.2.3
+Requires-Dist: polars>=1.20.0
+Requires-Dist: pytest>=8.3.4
+Requires-Dist: ruff>=0.9.3
+Requires-Dist: setuptools>=75.8.0
+Requires-Dist: tqdm>=4.67.1
+# pybaseballstats
+A Python package for scraping baseball statistics from the web. Inspired by the pybaseball package by James LeDoux. This package is a work in progress and is not yet ready for use.
+## Available Sources
+1. Baseball Savant
+## Usage
+Usage documentation can be found at /usage_docs/

pybaseballstats-0.0.1/pybaseballstats.egg-info/SOURCES.txt ADDED Viewed

@@ -0,0 +1,12 @@
+README.md
+pyproject.toml
+setup.py
+pybaseballstats/__init__.py
+pybaseballstats/fangraphs.py
+pybaseballstats/statcast.py
+pybaseballstats/statcast_utils.py
+pybaseballstats.egg-info/PKG-INFO
+pybaseballstats.egg-info/SOURCES.txt
+pybaseballstats.egg-info/dependency_links.txt
+pybaseballstats.egg-info/requires.txt
+pybaseballstats.egg-info/top_level.txt

pybaseballstats-0.0.1/pybaseballstats.egg-info/dependency_links.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+

pybaseballstats-0.0.1/pybaseballstats.egg-info/requires.txt ADDED Viewed

@@ -0,0 +1,9 @@
+aiohttp>=3.11.11
+asyncio>=3.4.3
+bs4>=0.0.2
+pandas>=2.2.3
+polars>=1.20.0
+pytest>=8.3.4
+ruff>=0.9.3
+setuptools>=75.8.0
+tqdm>=4.67.1

pybaseballstats-0.0.1/pybaseballstats.egg-info/top_level.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+ pybaseballstats

pybaseballstats-0.0.1/pyproject.toml ADDED Viewed

@@ -0,0 +1,17 @@
+[project]
+name = "pybaseballstats"
+version = "0.0.1"
+description = "A Python package for scraping baseball data."
+readme = "README.md"
+requires-python = ">=3.13"
+# Runtime dependencies. `requests` is imported by pybaseballstats/fangraphs.py
+# and pybaseballstats/statcast.py, so it must be declared here.
+# NOTE(review): `asyncio` is part of the standard library; the PyPI
+# distribution of that name is an old backport and can likely be dropped.
+# NOTE(review): pytest, ruff and setuptools look like development/build tools
+# rather than runtime requirements - consider moving them out of this list.
+dependencies = [
+    "aiohttp>=3.11.11",
+    "asyncio>=3.4.3",
+    "bs4>=0.0.2",
+    "pandas>=2.2.3",
+    "polars>=1.20.0",
+    "pytest>=8.3.4",
+    "requests>=2.32.3",
+    "ruff>=0.9.3",
+    "setuptools>=75.8.0",
+    "tqdm>=4.67.1",
+]

pybaseballstats-0.0.1/setup.cfg ADDED Viewed

@@ -0,0 +1,4 @@
+[egg_info]
+tag_build =
+tag_date = 0

pybaseballstats-0.0.1/setup.py ADDED Viewed

@@ -0,0 +1,8 @@
+from setuptools import find_packages, setup
+# Minimal setuptools entry point: only the name, version and package list are
+# given here.
+setup(
+    name="pybaseballstats",
+    version="0.0.1",
+    # Package discovery is limited to pybaseballstats and its subpackages.
+    packages=find_packages(include=["pybaseballstats", "pybaseballstats.*"]),
+    # No further arguments are passed; the description, Python requirement and
+    # dependencies are declared in pyproject.toml.
+)