Exemplo n.º 1
0
pa = plays.loc[plays['player'].shift() != plays['player'],
               ['year', 'game_id', 'inning', 'team', 'player']]

## Group Plate Appearances
pa = pa.groupby(['year', 'game_id', 'team']).size().reset_index(name='PA')

## Reshape Data by Event Type Per Plate Appearance by Setting Event Index and Unstacking the Resulting Frame
events = events.set_index(['year', 'game_id', 'team', 'event_type'])
events = events.unstack().fillna(0).reset_index()

## Clean Events Columns Labels
events.columns = events.columns.droplevel()
events.columns = [
    'year', 'game_id', 'team', 'BB', 'E', 'H', 'HBP', 'HR', 'ROE', 'SO'
]
events = events.rename_axis(None, axis='columns')

## Merge Plate Appearances
events_plus_pa = pd.merge(events,
                          pa,
                          how='outer',
                          left_on=['year', 'game_id', 'team'],
                          right_on=['year', 'game_id', 'team'])

## Merge Team
defense = pd.merge(events_plus_pa, info)

## Calculate DER (Defence Efficiency Ratio)
defense.loc[:, 'DER'] = 1 - ((defense['H'] + defense['ROE']) /
                             (defense['PA'] - defense['BB'] - defense['SO'] -
                              defense['HBP'] - defense['HR']))
Exemplo n.º 2
0
import pandas as pd
import matplotlib.pyplot as plt
from frames import games, info, events

plays = games.query("type == 'play' & event != 'NP'")
plays.columns = ["type", "inning", "team", "player", "count", "pitches", "event", "game_id", "year"]

pa = plays.loc[plays["player"].shift() != plays["player"], ["year", "game_id", "inning", "team", "player"]]
pa = pa.groupby(["year", "game_id", "team"]).size().reset_index(name="PA")

events = events.set_index(["year", "game_id", "team", "event_type"])
events = events.unstack().fillna(0).reset_index()
events.columns = events.columns.droplevel()
events.columns = ["year", "game_id", "team", "BB", "E", "H", "HBP", "HR", "ROE","SO"]
events = events.rename_axis("None", axis="columns")

events_plus_pa = pd.merge(events, pa, how="outer", left_on=["year", "game_id", "team"], right_on=["year", "game_id", "team"])
defense = pd.merge(events_plus_pa, info)

defense.loc[:, "DER"] = 1 - ((defense["H"] + defense["ROE"]) / (defense["PA"] - defense["BB"] - defense["SO"] - defense["HBP"] - defense["HR"]))
defense.loc[:, "year"] = pd.to_numeric(defense["year"])

der = defense.loc[defense["year"] >= 1978, ["year", "defense", "DER"]]
der = der.pivot(index="year", columns="defense", values="DER")

der.plot(x_compat=True, xticks=range(1978, 2018, 4), rot=45)

plt.savefig("defense.png")

plt.show()
Exemplo n.º 3
0
plays.columns = [
    'type', 'inning', 'team', 'player', 'count', 'pitches', 'event', 'game_id',
    'year'
]
pa = plays.loc[plays['player'].shift() != plays['player'],
               ['year', 'game_id', 'inning', 'team', 'player']]
pa = pa.groupby(['year', 'game_id', 'team']).size().reset_index(name='PA')
# print(pa)

events = events.set_index(['year', 'game_id', 'team', 'event_type'])
events = events.unstack().fillna(0).reset_index()
events.columns = events.columns.droplevel()
events.columns = [
    'year', 'game_id', 'team', 'BB', 'E', 'H', 'HBP', 'HR', 'ROE', 'SO'
]
events = events.rename_axis('None', axis='columns')
# print(events)
events_plus_pa = pd.merge(events,
                          pa,
                          how='outer',
                          left_on=['year', 'game_id', 'team'],
                          right_on=['year', 'game_id', 'team'])
defense = pd.merge(events_plus_pa, info)
defense.loc[:, 'DER'] = 1 - ((defense["H"] + defense["ROE"]) /
                             (defense["PA"] - defense["BB"] - defense["SO"] -
                              defense["HBP"] - defense["HR"]))
defense.loc[:, 'year'] = pd.to_numeric(defense.loc[:, 'year'])
der = defense.loc[defense['year'] >= 1978, ['year', 'defense', 'DER']]
der = der.pivot(index='year', columns='defense', values='DER')
# print(der)
der.plot(x_compat=True, xticks=range(1978, 2018, 4), rot=45)
Exemplo n.º 4
0
pa = pa.groupby(["year", "game_id", "team"]).size().reset_index(name="PA")

events = events.set_index(["year", "game_id", "team", "event_type"])
print(events.info())
print(events.head())
events = events.unstack().fillna(0).reset_index()

print(events.info())
print(events.head())

events.columns = events.columns.droplevel()
events.columns = [
    "year", "game_id", "team", "BB", "E", "H", "HBP", "HR", "ROE", "SO"
]
events = events.rename_axis(None, axis="columns")
print(events.head())

events_plus_pa = pd.merge(events,
                          pa,
                          how="outer",
                          left_on=['year', 'game_id', 'team'],
                          right_on=['year', 'game_id', 'team'])
print(events_plus_pa.head())
print(info.info())
print(info.head())
defense = pd.merge(events_plus_pa, info)
defense.loc[:, 'DER'] = 1 - ((defense["H"] + defense["ROE"]) /
                             (defense["PA"] - defense["BB"] - defense["SO"] -
                              defense["HBP"] - defense["HR"]))
defense.loc[:, "year"] = pd.to_numeric(defense.loc[:, "year"])
plays = games.query('type == "play" and event != "NP"')
plays.columns = [
    'type', 'inning', 'team', 'player', 'count', 'pitches', 'event', 'game_id',
    'year'
]
pa = plays.loc[plays['player'].shift() != plays['player'],
               ['year', 'game_id', 'inning', 'team', 'player']]
pa = pa.groupby(['year', 'game_id', 'team']).size().reset_index(name='PA')
events = events.set_index(['year', 'game_id', 'team', 'event_type'])
events = events.unstack().fillna(0).reset_index()
events.columns = events.columns.droplevel()
events.columns = [
    'year', 'game_id', 'team', 'BB', 'E', 'H', 'HBP', 'HR', 'ROE', 'SO'
]
events = events.rename_axis('None', axis="columns")
events_plus_pa = pd.merge(events,
                          pa,
                          how="outer",
                          left_on=['year', 'game_id', 'team'],
                          right_on=['year', 'game_id', 'team'])
defense = pd.merge(events_plus_pa, info)
defense.loc[:, 'DER'] = 1 - ((defense['H'] + defense['ROE']) /
                             (defense['PA'] - defense['BB'] - defense['SO'] -
                              defense['HBP'] - defense['HR']))
defense.loc[:, 'year'] = pd.to_numeric(defense.loc[:, 'year'])
der = defense.loc[defense['year'] >= 1978, ['year', 'defense', 'DER']]
der = der.pivot(index='year', columns='defense', values='DER')
der.plot(x_compat=True, xticks=range(1978, 2018, 4), rot=45)
plt.show()