Ejemplo n.º 1
0
def get_player_rosters(league,
                       season,
                       results_array=None,
                       multiple_teams=False):
    """Collect the rosters of every team in a league for one season.

    Fetches the league standings page from eliteprospects.com, derives a
    season-specific URL for each team linked from it, and passes each URL to
    ``teamroster.get_team_roster`` together with ``results_array``.

    Args:
        league: League identifier; converted with ``str`` and placed in the
            standings URL query string.
        season: Second year of the season (e.g. 2014 for 2013-14); must be
            convertible to ``int``.
        results_array: List handed to ``teamroster.get_team_roster``. A new
            list is created when omitted.
        multiple_teams: Flag forwarded unchanged to
            ``teamroster.get_team_roster``.

    Returns:
        ``results_array`` (the list passed in, or the newly created one).
    """
    league = str(league)
    season = str(season)
    # The season is named by its second year, so it starts the year before
    previous_year = int(season) - 1

    if results_array is None:
        results_array = []
    player_ids = []
    team_urls = []

    # Get the league link
    team_search_url = "http://www.eliteprospects.com/standings.php?league={0}&startdate={1}".format(
        league, str(previous_year))
    team_search_request = requests.get(team_search_url)

    # All tag names have this prepended to them
    html_prefix = '{http://www.w3.org/1999/xhtml}'
    team_search_page = html5lib.parse(team_search_request.text)
    team_table = team_search_page.find(
        './/*[@id="standings"]/{0}div/{0}div[3]/{0}table'.replace(
            '{0}', html_prefix))

    teams_by_conference = helpers.get_ep_table_rows(team_table)

    # Raw string: '\d' inside a plain literal is an invalid escape sequence.
    # Both the pattern and the link path are loop-invariant, so build them once.
    season_suffix = re.compile(r'/\d{4}-\d{4}$')
    team_link_path = './/{0}td[2]/{0}span/{0}a'.format(html_prefix)

    for conference in teams_by_conference:
        for team in conference:
            team_url: str = team.find(team_link_path).attrib['href']
            # Drop a season already present in the link so that the requested
            # season can be appended instead
            if season_suffix.search(team_url):
                team_url = team_url[:team_url.rfind('/')]
            if team_url.endswith('/'):
                team_url = team_url[:-1]
            team_urls.append("{}/{}-{}".format(team_url,
                                               previous_year, season))

    # Get the players
    for team_url in team_urls:
        teamroster.get_team_roster(team_url, season, league, player_ids,
                                   results_array, multiple_teams)

    return results_array
Ejemplo n.º 2
0
def get_player_rosters(league, season, results_array=None, multiple_teams=False):
    """Gather roster data for every team linked from a league's standings page.

    Downloads the eliteprospects.com standings page for the season, reads the
    team links out of the standings table, and calls
    ``teamroster.get_team_roster`` once per team URL.

    Args:
        league: League identifier; converted with ``str`` for the URL.
        season: Second year of the season; must be convertible to ``int``
            (the page is requested with ``startdate`` set to ``season - 1``).
        results_array: List handed to ``teamroster.get_team_roster``; a new
            list is created when omitted.
        multiple_teams: Flag forwarded unchanged to
            ``teamroster.get_team_roster``.

    Returns:
        ``results_array`` (the list passed in, or the newly created one).
    """
    league = str(league)
    season = str(season)

    results_array = [] if results_array is None else results_array
    player_ids = []

    # Get the league link
    start_year = str(int(season) - 1)
    team_search_url = "http://www.eliteprospects.com/standings.php?league={0}&startdate={1}".format(league, start_year)
    standings_response = requests.get(team_search_url)

    # Every tag name in the parsed tree carries this namespace prefix
    ns = '{http://www.w3.org/1999/xhtml}'
    standings_page = html5lib.parse(standings_response.text)
    # /html/body/div/table[3]/tbody/tr/td[5]/table[3]
    team_table_path = './{0}body/{0}div/{0}table[3]/{0}tbody/{0}tr/{0}td[5]/{0}table[3]'.format(ns)
    team_table = standings_page.find(team_table_path)

    team_links = team_table.findall('.//{0}tbody/{0}tr/{0}td[2]/{0}a'.format(ns))

    # The first matched link is skipped (presumably a header entry -- confirm
    # against the page layout)
    team_urls = [link.attrib['href'] for link in team_links[1:]]

    # Get the players
    for team_url in team_urls:
        teamroster.get_team_roster(team_url, season, player_ids, results_array, multiple_teams, league)

    return results_array
Ejemplo n.º 3
0
def _scrape_to_csv(fetch, leagues, start_season, end_season, suffix):
    """Call ``fetch`` for every league/season pair, export the rows, and return the failure count.

    Args:
        fetch: Callable invoked as ``fetch(league, season, results_array)``.
        leagues: Values from the positional ``leagues`` argument.
        start_season: First season to process (inclusive).
        end_season: Last season to process (inclusive).
        suffix: Trailing part of the CSV file name, e.g. ``'rosters'``.

    Returns:
        Number of league/season pairs for which ``fetch`` raised.
    """
    results_array = []
    failures = 0

    for league in leagues:
        for season in range(start_season, end_season + 1):
            try:
                fetch(league, season, results_array)
            except Exception as e:
                # Best effort: report the failed pair and keep going with the rest
                failures += 1
                print('Error in {0} {1}'.format(league, season))
                print(e)

    helpers.export_array_to_csv(
        results_array,
        '{0}-{1}_{2}_{3}.csv'.format(start_season, end_season, '-'.join(leagues), suffix))
    return failures


def main():
    """Command-line entry point: scrape the requested data sets and export each to CSV.

    Each of ``--roster``, ``--team_roster``, ``--stats`` and ``--standings``
    selects one data set; every selected data set is scraped for all given
    leagues over the inclusive season range ``start_season``..``--range`` and
    written to its own CSV file via ``helpers.export_array_to_csv``.

    Errors raised while scraping a league/season pair are printed and do not
    stop the run; the final message reports whether any occurred.
    """
    arg_parser = argparse.ArgumentParser(description="Get prospect data from any league on the planet over a range of seasons")
    arg_parser.add_argument('--roster', action='store_true', help="Output roster list for the given league(s) and season(s)")
    arg_parser.add_argument('--team_roster', action='store_true', help="Output roster list for the given team and season(s)")
    arg_parser.add_argument('--stats', action='store_true', help="Output stats list for the given league(s) and season(s)")
    arg_parser.add_argument('--standings', action='store_true', help="All teams in league, with goals for/against")
    arg_parser.add_argument('--multiple_teams', action='store_true', help="Whether to show all teams a player has played for")
    arg_parser.add_argument('leagues', type=helpers.comma_delimited_list, help="Comma-delimited list (no spaces) of leagues")
    arg_parser.add_argument('start_season', type=int, help="Earliest season for which to scrape data. Second year of the season (i.e. passing 2014 refers to the 2013-14 season)")
    arg_parser.add_argument('--range', type=int, help="Choose the latest season to parse to parse many seasons at once. Second year of the season (i.e. passing 2014 refers to the 2013-14 season)", required=False)

    args = arg_parser.parse_args()

    start_season = args.start_season
    # Without --range only the single start season is processed
    end_season = args.range if args.range is not None else args.start_season
    multiple_teams = args.multiple_teams

    failures = 0

    if args.roster:
        failures += _scrape_to_csv(
            lambda league, season, rows: roster.get_player_rosters(league, season, rows, multiple_teams),
            args.leagues, start_season, end_season, 'rosters')

    if args.team_roster:
        # When running team_rosters, the 'leagues' argument is actually teams
        failures += _scrape_to_csv(
            lambda team, season, rows: teamroster.get_team_roster(
                'team.php?team={0}&year0={1}'.format(team, season), season, results_array=rows),
            args.leagues, start_season, end_season, 'team_rosters')

    if args.stats:
        failures += _scrape_to_csv(
            lambda league, season, rows: stats.get_player_stats(league, season, rows, multiple_teams),
            args.leagues, start_season, end_season, 'stats')

    if args.standings:
        failures += _scrape_to_csv(
            lambda league, season, rows: standings.get_league_standings(league, season, rows),
            args.leagues, start_season, end_season, 'standings')

    # Only claim success when nothing was swallowed along the way
    if failures:
        print("Finished with {0} error(s)".format(failures))
    else:
        print("Success!")
Ejemplo n.º 4
0
def main():
    """Command-line entry point: scrape the requested data sets and export each to CSV.

    Flags select what to scrape (``--icetime``, ``--roster``, ``--team_roster``,
    ``--team_stats``, ``--stats``, ``--standings``); several may be combined.
    Every selected data set is processed for the inclusive season range
    ``start_season``..``--range`` and written to its own CSV file via
    ``helpers.export_array_to_csv``.

    ``--icetime`` requires the ``leagues`` argument to be exactly ``nhl``;
    otherwise an error is printed and the function returns before handling any
    other flag. ``--team_roster`` and ``--team_stats`` take a team value and
    require exactly one league.
    """
    arg_parser = argparse.ArgumentParser(
        description="Get prospect data from any league on the planet over a range of seasons")
    arg_parser.add_argument('--roster', action='store_true',
                            help="Output roster list for the given league(s) and season(s)")
    arg_parser.add_argument('--team_roster', type=str,
                            help="Output roster list for the given team and season(s)")
    arg_parser.add_argument('--stats', action='store_true',
                            help="Output stats list for the given league(s) and season(s)")
    arg_parser.add_argument('--team_stats', type=str,
                            help="Output stats list for the given team and season(s)")
    arg_parser.add_argument('--playoffs', action='store_true',
                            help="Use playoff instead of regular season stats")
    arg_parser.add_argument('--standings', action='store_true',
                            help="All teams in league, with goals for/against")
    arg_parser.add_argument(
        '--icetime', action='store_true', help="NHL icetime for season")
    arg_parser.add_argument('--multiple_teams', action='store_true',
                            help="Whether to show all teams a player has played for")
    arg_parser.add_argument('leagues', type=helpers.comma_delimited_list,
                            help="Comma-delimited list (no spaces) of leagues")
    arg_parser.add_argument('start_season', type=int,
                            help="Earliest season for which to scrape data. Second year of the season (i.e. passing 2014 refers to the 2013-14 season)")
    arg_parser.add_argument(
        '--range', type=int, help="Choose the latest season to parse to parse many seasons at once. Second year of the season (i.e. passing 2014 refers to the 2013-14 season)", required=False)

    args = arg_parser.parse_args()

    start_season = args.start_season
    # Without --range only the single start season is processed
    end_season = args.range if args.range is not None else args.start_season
    multiple_teams = args.multiple_teams
    playoffs = args.playoffs

    if args.icetime:
        # Compare by value: `is not 1` tests object identity, which is not a
        # reliable integer comparison and triggers a SyntaxWarning on 3.8+
        if len(args.leagues) != 1 or args.leagues[0].lower() != "nhl":
            print("Error: Icetime is currently only supported for the NHL")
            return

        results_array = []

        for season in range(start_season, end_season + 1):
            icetime.get_nhl_season_icetime(season, results_array)

        helpers.export_array_to_csv(
            results_array, '{0}-{1}_{2}_icetime.csv'.format(start_season, end_season, 'nhl'))

    if args.roster:
        results_array = []

        for league in args.leagues:
            for season in range(start_season, end_season + 1):
                roster.get_player_rosters(league, season, results_array, multiple_teams)

        helpers.export_array_to_csv(results_array, '{0}-{1}_{2}_rosters.csv'.format(
            start_season, end_season, '-'.join(args.leagues)))

    if args.team_roster is not None:
        results_array = []

        if len(args.leagues) != 1:
            print(
                'Error: must supply a single league for the team you wish to fetch the roster of')
        else:
            league = args.leagues[0]
            for season in range(start_season, end_season + 1):
                teamroster.get_team_roster('https://eliteprospects.com/team.php?team={0}&year0={1}'.format(
                    args.team_roster, season), season, league, results_array=results_array)

        # NOTE(review): the export still runs, with no rows collected, after the
        # error branch above -- confirm whether that is intended
        helpers.export_array_to_csv(results_array, '{0}-{1}_{2}_team_rosters.csv'.format(
            start_season, end_season, '-'.join(args.leagues)))

    if args.team_stats is not None:
        results_array = []
        goalie_results_array = []

        if len(args.leagues) != 1:
            print(
                'Error: must supply a single league for the team you wish to fetch stats for')
        else:
            league = args.leagues[0]
            for season in range(start_season, end_season + 1):
                team_stats.get_player_stats(
                    'https://www.eliteprospects.com/team/{}/{}-{}?tab=stats#players'.format(
                        args.team_stats,
                        int(season) - 1,
                        season
                    ),
                    season,
                    league,
                    results_array=results_array,
                    goalie_results_array=goalie_results_array
                )

        # NOTE(review): as with --team_roster, both exports still run after the
        # error branch above -- confirm whether that is intended
        helpers.export_array_to_csv(results_array, '{0}-{1}_{2}_team_stats.csv'.format(
            start_season, end_season, '-'.join(args.leagues)))
        helpers.export_array_to_csv(goalie_results_array, '{0}-{1}_{2}_team_goalie_stats.csv'.format(
            start_season, end_season, '-'.join(args.leagues)))

    if args.stats:
        results_array = []
        goalie_results_array = []

        # NOTE(review): `playoffs` only affects the output file names below; it
        # is not passed to stats.get_player_stats here -- verify that the
        # scraper picks the playoff setting up some other way
        for league in args.leagues:
            for season in range(start_season, end_season + 1):
                stats.get_player_stats(
                    league, season, results_array, goalie_results_array)

        helpers.export_array_to_csv(
            results_array,
            '{0}-{1}_{2}{3}_stats.csv'.format(start_season, end_season, '-'.join(
                args.leagues), '_playoff' if playoffs else '')
        )
        helpers.export_array_to_csv(
            goalie_results_array,
            '{0}-{1}_{2}{3}_goalie_stats.csv'.format(start_season, end_season, '-'.join(
                args.leagues), '_playoff' if playoffs else '')
        )

    if args.standings:
        results_array = []

        for league in args.leagues:
            for season in range(start_season, end_season + 1):
                standings.get_league_standings(
                    league, season, results_array)

        helpers.export_array_to_csv(results_array, '{0}-{1}_{2}_standings.csv'.format(
            start_season, end_season, '-'.join(args.leagues)))

    print("Success!")