Source code for sportsreference.nfl.teams

import pandas as pd
import re
from .constants import PARSING_SCHEME, SEASON_PAGE_URL
from pyquery import PyQuery as pq
from ..decorators import float_property_decorator, int_property_decorator
from .. import utils
from .roster import Roster
from .schedule import Schedule


[docs]class Team(object): """ An object containing all of a team's season information. Finds and parses all team stat information and identifiers, such as rank, name, and abbreviation, and sets them as properties which can be directly read from for easy reference. Parameters ---------- team_data : string A string containing all of the rows of stats for a given team. If multiple tables are being referenced, this will be comprised of multiple rows in a single string. rank : int A team's position in the league based on the number of points they obtained during the season. year : string (optional) The requested year to pull stats from. """ def __init__(self, team_data, rank, year=None): self._year = year self._rank = rank self._abbreviation = None self._name = None self._wins = None self._losses = None self._win_percentage = None self._games_played = None self._points_for = None self._points_against = None self._points_difference = None self._margin_of_victory = None self._strength_of_schedule = None self._simple_rating_system = None self._offensive_simple_rating_system = None self._defensive_simple_rating_system = None self._yards = None self._plays = None self._yards_per_play = None self._turnovers = None self._fumbles = None self._first_downs = None self._pass_completions = None self._pass_attempts = None self._pass_yards = None self._pass_touchdowns = None self._interceptions = None self._pass_net_yards_per_attempt = None self._pass_first_downs = None self._rush_attempts = None self._rush_yards = None self._rush_touchdowns = None self._rush_yards_per_attempt = None self._rush_first_downs = None self._penalties = None self._yards_from_penalties = None self._first_downs_from_penalties = None self._percent_drives_with_points = None self._percent_drives_with_turnovers = None self._points_contributed_by_offense = None self._parse_team_data(team_data) def _parse_team_data(self, team_data): """ Parses a value for every attribute. This function looks through every attribute with the exception of '_rank' and retrieves the value according to the parsing scheme and index of the attribute from the passed HTML data. Once the value is retrieved, the attribute's value is updated with the returned result. Note that this method is called directly once Team is invoked and does not need to be called manually. Parameters ---------- team_data : string A string containing all of the rows of stats for a given team. If multiple tables are being referenced, this will be comprised of multiple rows in a single string. """ for field in self.__dict__: # The rank attribute is passed directly to the class during # instantiation. if field == '_rank' or \ field == '_year': continue value = utils._parse_field(PARSING_SCHEME, team_data, str(field)[1:]) setattr(self, field, value) @property def dataframe(self): """ Returns a pandas DataFrame containing all other class properties and values. The index for the DataFrame is the string abbreviation of the team, such as 'KAN'. """ fields_to_include = { 'abbreviation': self.abbreviation, 'defensive_simple_rating_system': self.defensive_simple_rating_system, 'first_downs': self.first_downs, 'first_downs_from_penalties': self.first_downs_from_penalties, 'fumbles': self.fumbles, 'games_played': self.games_played, 'interceptions': self.interceptions, 'losses': self.losses, 'margin_of_victory': self.margin_of_victory, 'name': self.name, 'offensive_simple_rating_system': self.offensive_simple_rating_system, 'pass_attempts': self.pass_attempts, 'pass_completions': self.pass_completions, 'pass_first_downs': self.pass_first_downs, 'pass_net_yards_per_attempt': self.pass_net_yards_per_attempt, 'pass_touchdowns': self.pass_touchdowns, 'pass_yards': self.pass_yards, 'penalties': self.penalties, 'percent_drives_with_points': self.percent_drives_with_points, 'percent_drives_with_turnovers': self.percent_drives_with_turnovers, 'plays': self.plays, 'points_against': self.points_against, 'points_contributed_by_offense': self.points_contributed_by_offense, 'points_difference': self.points_difference, 'points_for': self.points_for, 'rank': self.rank, 'rush_attempts': self.rush_attempts, 'rush_first_downs': self.rush_first_downs, 'rush_touchdowns': self.rush_touchdowns, 'rush_yards': self.rush_yards, 'rush_yards_per_attempt': self.rush_yards_per_attempt, 'simple_rating_system': self.simple_rating_system, 'strength_of_schedule': self.strength_of_schedule, 'turnovers': self.turnovers, 'win_percentage': self.win_percentage, 'wins': self.wins, 'yards': self.yards, 'yards_from_penalties': self.yards_from_penalties, 'yards_per_play': self.yards_per_play } return pd.DataFrame([fields_to_include], index=[self._abbreviation]) @int_property_decorator def rank(self): """ Returns an ``int`` of the team's rank based on the number of points they scored during the season. """ return self._rank @property def abbreviation(self): """ Returns a ``string`` of team's abbreviation, such as 'KAN' for the Kansas City Chiefs. """ return self._abbreviation @property def schedule(self): """ Returns an instance of the Schedule class containing the team's complete schedule for the season. """ return Schedule(self._abbreviation, self._year) @property def roster(self): """ Returns an instance of the Roster class containing all players for the team during the season with all career stats. """ return Roster(self._abbreviation, self._year) @property def name(self): """ Returns a ``string`` of the team's full name, such as 'Kansas City Chiefs'. """ return self._name @int_property_decorator def wins(self): """ Returns an ``int`` of the number of games the team won during the season. """ return self._wins @int_property_decorator def losses(self): """ Returns an ``int`` of the number of games the team lost during the season. """ return self._losses @float_property_decorator def win_percentage(self): """ Returns a ``float`` of the number of wins divided by the number of games played. Percentage ranges from 0-1. """ return self._win_percentage @int_property_decorator def games_played(self): """ Returns an ``int`` of the number of games played during the season. """ return self._games_played @int_property_decorator def points_for(self): """ Returns an ``int`` of the total number of points scored during the season. """ return self._points_for @int_property_decorator def points_against(self): """ Returns an ``int`` of the total number of points allowed during the season. """ return self._points_against @int_property_decorator def points_difference(self): """ Returns an ``int`` of the difference between the number of points scored and allowed during the season. """ return self._points_difference @float_property_decorator def margin_of_victory(self): """ Returns a ``float`` of the average margin of victory per game. """ return self._margin_of_victory @float_property_decorator def strength_of_schedule(self): """ Returns a ``float`` of the team's strength of schedule. An average difficulty schedule is denoted with a 0.0 and a negative number is comparatively easier than average. """ return self._strength_of_schedule @float_property_decorator def simple_rating_system(self): """ Returns a ``float`` of the team's relative strength based on average margin of victory plus strength of schedule. An average team is denoted with 0.0 and a negative score is a comparatively weaker team. """ return self._simple_rating_system @float_property_decorator def offensive_simple_rating_system(self): """ Returns a ``float`` of the team's offensive strength according to the simple rating system. An average team is denoted with 0.0 and a negative score is a comparatively weaker team. """ return self._offensive_simple_rating_system @float_property_decorator def defensive_simple_rating_system(self): """ Returns a ``float`` of the team's defensive strength according to the simple rating system. An average team is denoted with 0.0 and a negative score is a comparatively weaker team. """ return self._defensive_simple_rating_system @int_property_decorator def yards(self): """ Returns an ``int`` of the total number of yards the team has gained during the season. """ return self._yards @int_property_decorator def plays(self): """ Returns an ``int`` of the total number of offensive plays the team has made during the season. """ return self._plays @float_property_decorator def yards_per_play(self): """ Returns a ``float`` of the average number of yards gained per play during the season. """ return self._yards_per_play @int_property_decorator def turnovers(self): """ Returns an ``int`` of the total number of turnovers the team committed during the season. """ return self._turnovers @int_property_decorator def fumbles(self): """ Returns an ``int`` of the total number of times the team fumbled the ball during the season. """ return self._fumbles @int_property_decorator def first_downs(self): """ Returns an ``int`` of the total number of first downs the team achieved during the season. """ return self._first_downs @int_property_decorator def pass_completions(self): """ Returns an ``int`` of the total number of passes that were completed. """ return self._pass_completions @int_property_decorator def pass_attempts(self): """ Returns an ``int`` of the total number of passes that were attempted. """ return self._pass_attempts @int_property_decorator def pass_yards(self): """ Returns an ``int`` of the total number of yards the team gained from passing. """ return self._pass_yards @int_property_decorator def pass_touchdowns(self): """ Returns an ``int`` of the total number of touchdowns the team has scored from passing. """ return self._pass_touchdowns @int_property_decorator def interceptions(self): """ Returns an ``int`` of the total number of interceptions the team has thrown. """ return self._interceptions @float_property_decorator def pass_net_yards_per_attempt(self): """ Returns a ``float`` of the net yards gained per passing play including sacks. """ return self._pass_net_yards_per_attempt @int_property_decorator def pass_first_downs(self): """ Returns an ``int`` of the number of first downs the team gained from passing plays. """ return self._pass_first_downs @int_property_decorator def rush_attempts(self): """ Returns an ``int`` of the total number of rushing plays that were attempted. """ return self._rush_attempts @int_property_decorator def rush_yards(self): """ Returns an ``int`` of the total number of yards that were gained from rushing plays. """ return self._rush_yards @int_property_decorator def rush_touchdowns(self): """ Returns an ``int`` of the total number of touchdowns from rushing plays. """ return self._rush_touchdowns @float_property_decorator def rush_yards_per_attempt(self): """ Returns a ``float`` of the average number of yards gained per rushing play. """ return self._rush_yards_per_attempt @int_property_decorator def rush_first_downs(self): """ Returns an ``int`` of the total number of first downs gained from rushing plays. """ return self._rush_first_downs @int_property_decorator def penalties(self): """ Returns an ``int`` of the total number of penalties called on the team during the season. """ return self._penalties @int_property_decorator def yards_from_penalties(self): """ Returns an ``int`` of the total number of yards surrendered as a result of penalties called on the team. """ return self._yards_from_penalties @int_property_decorator def first_downs_from_penalties(self): """ Returns an ``int`` of the total number of first downs conceded as a result of penalties called on the team. """ return self._first_downs_from_penalties @float_property_decorator def percent_drives_with_points(self): """ Returns a ``float`` of the percentage of drives that result in points for the offense. Percentage ranges from 0-100. """ return self._percent_drives_with_points @float_property_decorator def percent_drives_with_turnovers(self): """ Returns a ``float`` of the percentage of drives that result in an offensive turnover. Percentage ranges from 0-100. """ return self._percent_drives_with_turnovers @float_property_decorator def points_contributed_by_offense(self): """ Returns a ``float`` of the number of expected points contributed by the offense. """ return self._points_contributed_by_offense
[docs]class Teams: """ A list of all NFL teams and their stats in a given year. Finds and retrieves a list of all NFL teams from www.pro-football-reference.com and creates a Team instance for every team that participated in the league in a given year. The Team class comprises a list of all major stats and a few identifiers for the requested season. Parameters ---------- year : string (optional) The requested year to pull stats from. """ def __init__(self, year=None): self._teams = [] self._retrieve_all_teams(year) def __getitem__(self, abbreviation): """ Return a specified team. Returns a team's instance in the Teams class as specified by the team's abbreviation. Parameters ---------- abbreviation : string An NFL team's three letter abbreviation (ie. 'KAN' for Kansas City Chiefs). Returns ------- Team instance If the requested team can be found, its Team instance is returned. Raises ------ ValueError If the requested team is not present within the Teams list. """ for team in self._teams: if team.abbreviation.upper() == abbreviation.upper(): return team raise ValueError('Team abbreviation %s not found' % abbreviation) def __call__(self, abbreviation): """ Return a specified team. Returns a team's instance in the Teams class as specified by the team's abbreviation. This method is a wrapper for __getitem__. Parameters ---------- abbreviation : string An NFL team's three letter abbreviation (ie. 'KAN' for Kansas City Chiefs). Returns ------- Team instance If the requested team can be found, its Team instance is returned. """ return self.__getitem__(abbreviation) def __repr__(self): """Returns a ``list`` of all NFL teams for the given season.""" return self._teams def __iter__(self): """Returns an iterator of all of the NFL teams for a given season.""" return iter(self.__repr__()) def __len__(self): """Returns the number of NFL teams for a given season.""" return len(self.__repr__()) def _add_stats_data(self, teams_list, team_data_dict): """ Add a team's stats row to a dictionary. Pass table contents and a stats dictionary of all teams to accumulate all stats for each team in a single variable. Parameters ---------- teams_list : generator A generator of all row items in a given table. team_data_dict : {str: {'data': str, 'rank': int}} dictionary A dictionary where every key is the team's abbreviation and every value is another dictionary with a 'data' key which contains the string version of the row data for the matched team, and a 'rank' key which is the rank of the team. Returns ------- dictionary An updated version of the team_data_dict with the passed table row information included. """ # Teams are listed in terms of rank with the first team being #1 rank = 1 for team_data in teams_list: if 'class="thead onecell"' in str(team_data): continue abbr = utils._parse_field(PARSING_SCHEME, team_data, 'abbreviation') try: team_data_dict[abbr]['data'] += team_data except KeyError: team_data_dict[abbr] = {'data': team_data, 'rank': rank} rank += 1 return team_data_dict def _retrieve_all_teams(self, year): """ Find and create Team instances for all teams in the given season. For a given season, parses the specified NFL stats table and finds all requested stats. Each team then has a Team instance created which includes all requested stats and a few identifiers, such as the team's name and abbreviation. All of the individual Team instances are added to a list. Note that this method is called directly once Teams is invoked and does not need to be called manually. Parameters ---------- year : string The requested year to pull stats from. """ team_data_dict = {} if not year: year = utils._find_year_for_season('nfl') doc = pq(SEASON_PAGE_URL % year) teams_list = utils._get_stats_table(doc, 'div#all_team_stats') afc_list = utils._get_stats_table(doc, 'table#AFC') nfc_list = utils._get_stats_table(doc, 'table#NFC') for stats_list in [teams_list, afc_list, nfc_list]: team_data_dict = self._add_stats_data(stats_list, team_data_dict) for team_data in team_data_dict.values(): team = Team(team_data['data'], team_data['rank'], year) self._teams.append(team) @property def dataframes(self): """ Returns a pandas DataFrame where each row is a representation of the Team class. Rows are indexed by the team abbreviation. """ frames = [] for team in self.__iter__(): frames.append(team.dataframe) return pd.concat(frames)