In [12]:
from pml.api import *
import pandas as pd
import matplotlib.pyplot as plt
In [2]:
data = load("../dataset_ext2.csv")
data = data.drop_empty_samples()
data.fill_missing_with_feature_means()
In [3]:
data.get_label_value_counts()
Out[3]:
In [13]:
# Get first principal component
princomp = pca(data, 1)
signed_weights = pd.Series(princomp.weights[:, 0],
index=princomp._original_features)
In [15]:
print signed_weights.order(ascending=False)
In [17]:
min_weight = signed_weights.min()
max_weight = signed_weights.max()
print min_weight, max_weight
In [21]:
normalized_weights = ((signed_weights - min_weight)
/ (max_weight - min_weight))
print normalized_weights.order(ascending=False)
In [ ]: