In [1]:
import pandas as pd
import numpy as np
In [11]:
# Preview the first five rows of `df`.
# NOTE(review): `df` is not created in any cell visible here; confirm it is
# loaded before this cell so the notebook survives Restart & Run All.
df.head(n=5)
Out[11]:
In [40]:
# Preview the first five rows of the column-by-column frame `Dfg`.
# NOTE(review): in file order this cell sits above the cell that assigns
# `Dfg`, so it fails on a fresh kernel; consider moving it below that cell.
Dfg.head(n=5)
Out[40]:
In [38]:
# Count the entries of column `j` that equal 25. The value is computed but not
# displayed, because it is not the last expression of the cell.
# NOTE(review): `j` is not assigned in this cell; it is presumably left over
# from a loop in another cell — confirm, or replace it with an explicit column.
(df[j].values == 25).sum()
# Empty square frame labelled by df's column names on both axes; every cell
# starts out as NaN until it is filled in elsewhere.
Dfg = pd.DataFrame(index=df.columns.values, columns=df.columns.values)
In [54]:
# Report every ordered pair of labels (o, k) whose entry in Dfg equals 1.
# Entries that are still NaN fail the equality test and are skipped.
for o in Dfg.columns.values:
    for k in Dfg.columns.values:
        if Dfg.loc[o, k] == 1:
            # One pre-formatted argument prints the same text under the
            # Python 2 print statement and the Python 3 print function.
            print("%s %s %s" % (o, k, Dfg.loc[o, k]))
In [52]:
# For every ordered pair of distinct columns (i, j): group the rows of df by
# column i, count the distinct values of column j inside each group, and store
# the 0.98 quantile of those per-group counts in Dfg at row i, column j.
# NOTE(review): the original indentation was lost; every statement after
# `if i != j` is assumed to belong to that branch (diagonal left unset) — confirm.
#df = df.drop('ACTION' , axis = 1 )
for i in df.columns.values:
    # Progress marker: the grouping column currently being processed.
    print(i)
    for j in df.columns.values:
        if i != j:
            print("==========")
            # NOTE(review): `count` is not read inside this loop; it is kept
            # in case another cell inspects it — drop it if nothing does.
            count = df[j].value_counts()
            x = df.groupby(i)[j].apply(lambda f: len(np.unique(f)))
            # Label-based assignment; .loc replaces the .ix indexer, which
            # is no longer available in current pandas releases.
            Dfg.loc[i, j] = x.quantile(0.98)
In [9]:
# Distinct values of column `j`, ordered from most to least frequent.
# NOTE(review): the original ended in an empty subscript (`index[]`), which is
# a syntax error; the intended position is unknown, so the whole index is
# shown. Use `.index[0]` if only the most frequent value was wanted.
# NOTE(review): `j` is not assigned in this cell — presumably left over from
# a loop in another cell; confirm.
df[j].value_counts().index
Out[9]:
In [15]:
# Show the current value of `x`.
# NOTE(review): `x` is not assigned in this cell — presumably the per-group
# result left over from the last loop iteration in another cell; confirm.
# Parenthesised single argument is valid on both Python 2 and Python 3.
print(x)
In [ ]: