In [ ]:
import blaze as bz
import pandas as pd
import numpy as np
from into import into
from bokeh.plotting import *
In [ ]:
# Put Bokeh (star-imported from bokeh.plotting) into notebook output mode so
# that the show(...) calls in later cells render inline in the notebook.
output_notebook()
In [ ]:
# Open the Lahman 2013 SQLite file (one directory above the notebook) through
# blaze, then display the datashape blaze reports for it.
lahman_uri = 'sqlite:///../lahman2013.sqlite'
db = bz.Data(lahman_uri)
db.dshape
In [ ]:
# Distinct team IDs from the Salaries table, using attribute-style column
# access and materialising the blaze expression with list().
list(db.Salaries.teamID.distinct())
In [ ]:
# Same distinct-teams query, this time with bracket-style column access and
# an explicit bz.compute() step before converting the result to a DataFrame.
distinct_teams = db.Salaries["teamID"].distinct()
r = bz.compute(distinct_teams)
into(pd.DataFrame, r)
In [ ]:
# Per-team salary summary: mean, maximum, and max/min ratio of salary,
# grouped by teamID and ordered by the ratio, largest first.
salaries = db.Salaries
pay = salaries.salary
per_team = bz.by(
    salaries.teamID,
    avg=pay.mean(),
    max=pay.max(),
    ratio=pay.max() / pay.min()
)
result = per_team.sort('ratio', ascending=False)

# Pull the blaze expression into pandas for the plotting cells.
df = into(pd.DataFrame, result)
In [ ]:
# Display the current DataFrame as the cell output.
df
In [ ]:
# Scatter of each team's 'avg' column, with the teams laid out along a
# categorical x-axis in the order produced by sorting on 'avg'.
# NOTE(review): DataFrame.sort exists only in older pandas (removed in 0.20);
# use sort_values if this notebook is moved to a newer pandas.
df = df.sort('avg')
team_order = list(df["teamID"])
p = figure(x_range=team_order)
source = ColumnDataSource(df)
p.scatter(x="teamID", y="avg", source=source)
show(p)
In [ ]:
# Same 'avg'-by-team scatter, but with the x-axis tick labels tilted so the
# team IDs do not run into each other.
df = df.sort('avg')
label_tilt = np.pi / 3  # passed to Bokeh's major_label_orientation
team_order = list(df["teamID"])
source = ColumnDataSource(df)
p = figure(x_range=team_order)
p.scatter(x="teamID", y="avg", source=source)
p.xaxis.major_label_orientation = label_tilt
show(p)
In [ ]:
# Two scatters sharing one ColumnDataSource -- 'avg' and 'ratio' per team --
# placed next to each other in a single-row grid.
df = df.sort('avg')
source = ColumnDataSource(df)

panels = []
for column in ("avg", "ratio"):
    fig = figure(x_range=list(df["teamID"]))
    fig.scatter(x="teamID", y=column, source=source)
    fig.xaxis.major_label_orientation = np.pi / 3
    panels.append(fig)

s1, s2 = panels
p = gridplot([[s1, s2]])
show(p)
In [ ]:
# Same pair of scatters ('avg' and 'ratio' per team) on one shared
# ColumnDataSource, now stacked vertically and with an explicit toolbar that
# includes the box/lasso selection tools.
TOOLS = "pan,wheel_zoom,box_zoom,reset,save,box_select,lasso_select"
df = df.sort('avg')
source = ColumnDataSource(df)

panels = []
for column in ("avg", "ratio"):
    fig = figure(x_range=list(df["teamID"]), tools=TOOLS)
    fig.scatter(x="teamID", y=column, source=source)
    fig.xaxis.major_label_orientation = np.pi / 3
    panels.append(fig)

s1, s2 = panels
p = gridplot([[s1], [s2]])
show(p)
In [ ]:
# Display the datashape blaze reports for the Salaries table.
db.Salaries.dshape
In [ ]:
# Blaze expression selecting the Salaries rows whose yearID is 2012;
# shown as the cell output.
salaries = db.Salaries
salaries[salaries.yearID == 2012]
In [ ]:
# Load the whole Salaries table into pandas and keep only the rows for team
# "LAA" in 2012.
# The original notebook left a blaze-side alternative disabled here:
#   r = bz.compute(db.Salaries[db.Salaries.yearID == 2012])
#   df = into(pd.DataFrame, r)
all_salaries = into(pd.DataFrame, db.Salaries)
is_laa = all_salaries["teamID"] == "LAA"
is_2012 = all_salaries["yearID"] == 2012
df = all_salaries[is_laa & is_2012]
df
In [ ]:
# Scatter of salary per player for whatever rows df currently holds, with
# player IDs on a categorical x-axis in DataFrame order.
TOOLS = "pan,wheel_zoom,box_zoom,reset,save,box_select,lasso_select"
player_order = list(df["playerID"])
p = figure(x_range=player_order, tools=TOOLS)
source = ColumnDataSource(df)
p.scatter(x="playerID", y="salary", source=source)
p.xaxis.major_label_orientation = np.pi / 3
show(p)
In [ ]:
# Salary-per-player scatter again, this time with the players ordered by
# salary along the x-axis.
# NOTE(review): DataFrame.sort exists only in older pandas (removed in 0.20);
# use sort_values if this notebook is moved to a newer pandas.
TOOLS = "pan,wheel_zoom,box_zoom,reset,save,box_select,lasso_select"
df = df.sort('salary')
player_order = list(df["playerID"])
p = figure(x_range=player_order, tools=TOOLS)
source = ColumnDataSource(df)
p.scatter(x="playerID", y="salary", source=source)
p.xaxis.major_label_orientation = np.pi / 3
show(p)
In [ ]: