In [1]:
import pandas as pd
import numpy as np

In [6]:
def off_win(row, games_df):
    """Return 1 if the team on offense for this play won the game, else 0.

    Parameters
    ----------
    row : pandas.Series
        One play. Must provide 'gid' (game id), 'off' and 'def' (team codes;
        'def' is only read when building the mismatch error message).
    games_df : pandas.DataFrame
        One row per game with columns 'h', 'v', 'ptsh' and 'ptsv'
        (presumably home/visitor team and their final points -- confirm
        against the data dictionary). If a 'gid' column is present it is
        used to verify that the right game was found.

    Returns
    -------
    int
        1 when the offense's score is strictly greater than the opponent's,
        0 otherwise. A tied game therefore yields 0 for both teams.

    Raises
    ------
    IndexError
        If the game cannot be located in ``games_df``.
    Exception
        If ``row['off']`` is neither the 'h' nor the 'v' team of the game.
    """
    gid = row.loc['gid']

    if 'gid' in games_df.columns:
        # Fast path: assume games are stored in gid order starting at 1, but
        # verify it. A filtered, shuffled or offset table would otherwise
        # silently hand back the wrong game (and gid 0 would wrap to the
        # last row).
        in_range = 0 <= gid - 1 < len(games_df)
        score = games_df.iloc[gid - 1] if in_range else None
        if score is None or score['gid'] != gid:
            matches = games_df.loc[games_df['gid'] == gid]
            if matches.empty:
                raise IndexError('No game with gid %s in games_df' % (gid,))
            score = matches.iloc[0]
    else:
        # No id column to check against: keep the positional convention.
        score = games_df.iloc[gid - 1]

    if row['off'] == score['h']:
        return 1 if score['ptsh'] > score['ptsv'] else 0

    if row['off'] == score['v']:
        return 1 if score['ptsv'] > score['ptsh'] else 0

    raise Exception('Teams do not match: %s vs. %s; %s vs. %s' % (
        row['off'], row['def'], score['v'], score['h']))

In [7]:
# Read the raw play-by-play table and the per-game table from disk.
plays_df, games_df = (
    pd.read_csv('../data/raw/PLAY.csv'),
    pd.read_csv('../data/raw/GAME.csv'),
)

In [8]:
# Narrow the play table to the thirteen columns listed below; every other
# column is dropped. A missing column raises KeyError.
plays_df = plays_df[[
    'gid', 'off', 'def',
    'qtr', 'min', 'sec',
    'ptso', 'ptsd',
    'timo', 'timd',
    'dwn', 'ytg', 'yfog',
]]

In [10]:
# Label every play with off_win's result (stored in column 'y'), evaluated
# row by row against the games table, then write the frame to CSV.
plays_df['y'] = plays_df.apply(off_win, axis=1, args=(games_df,))
plays_df.to_csv('../data/Xy.csv')

In [ ]: