In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline
In [2]:
# Leaderboard CSV; the relative path is resolved against the notebook's
# working directory.
LEADERBOARD_CSV = 'transfer-learning-on-stack-exchange-tags-publicleaderboard.csv'
leaderboard = pd.read_csv(LEADERBOARD_CSV)
# Fixed seed so the preview shows the same four rows on every fresh run.
leaderboard.sample(4, random_state=0)
Out[2]:
In [12]:
# Histogram of every score in the leaderboard frame (50 bins).
# Explicit fig/ax instead of the pyplot state machine; the trailing `;`
# keeps the Text(...) repr of the last call out of the cell output.
fig, ax = plt.subplots(figsize=(14, 6))
leaderboard['Score'].hist(bins=50, ax=ax)
ax.set_xlabel('F1 Score')
ax.set_ylabel('Number of leaderboard rows')
ax.set_title('Distribution of all leaderboard scores');
Out[12]:
In [4]:
# Display only the leaderboard rows whose Score is strictly greater than 0.9.
leaderboard.loc[leaderboard['Score'].gt(0.9)]
Out[4]:
In [5]:
# Keep each team's single highest-scoring row.
# `groupby('TeamId').first()` would take the first non-null value of every
# column independently, so a missing value in any column could splice values
# from two different rows into one; `drop_duplicates` keeps whole rows.
# Columns keep the order they have in `leaderboard`.
topByTeam = (
    leaderboard
    .dropna(subset=['TeamId'])              # groupby also excludes rows with a missing key
    .sort_values('Score', ascending=False)  # best score first (NaN scores sort last)
    .drop_duplicates(subset='TeamId', keep='first')
    .sort_values('TeamId')                  # same per-team ordering a groupby result has
    .reset_index(drop=True)
)
In [14]:
# Histogram of the per-team best scores held in topByTeam (30 bins).
# Explicit fig/ax instead of the pyplot state machine; the trailing `;`
# keeps the Text(...) repr of the last call out of the cell output.
fig, ax = plt.subplots(figsize=(14, 6))
topByTeam['Score'].hist(bins=30, ax=ax)
ax.set_xlabel('F1 Score')
ax.set_ylabel('Number of teams')
ax.set_title('Distribution of best score per team');
Out[14]:
In [ ]: