In [1]:
# NOTE(review): wildcard import. The cells below use `load`, `pca`, `kmeans`
# and `euclidean` without defining them, so they presumably come from here;
# consider importing those names explicitly so their origin is visible.
from pml.api import *
In [2]:
# Load the dataset. The path is relative, so it is resolved against the
# kernel's current working directory rather than a fixed location.
data = load("../dataset_ext2.csv")
# Called only for its side effect (the return value is discarded), so this
# presumably replaces missing values in `data` in place with the mean of the
# corresponding feature -- TODO confirm against the pml documentation.
# NOTE(review): if it does mutate in place, every later cell sees the
# imputed data, not the raw file contents.
data.fill_missing_with_feature_means()
In [3]:
# Run PCA on the (imputed) dataset and keep the result for clustering.
# The second argument (2) is presumably the number of principal components
# to retain -- TODO confirm against the signature of pml's `pca`.
reduced = pca(data, 2)
In [7]:
# Cluster the PCA output with k-means, requesting k=2 clusters and passing
# `euclidean` as the distance function.
# NOTE(review): no random seed is set anywhere in the visible cells. If pml's
# `kmeans` initialises centroids randomly, the clustering (and the purity
# computed from it) may differ between runs -- confirm whether a seed can be
# supplied.
clustered = kmeans(reduced, k=2, distance=euclidean)
In [11]:
# Bare last expression: the purity value is shown as this cell's output.
# Presumably purity is measured against class labels carried by the loaded
# dataset -- verify where `clustered` gets its ground-truth labels from.
clustered.calculate_purity()
Out[11]:
In [12]:
# Report the feature count of `data` (the loaded dataset, not the
# PCA-reduced `reduced`), displayed as this cell's output.
data.num_features()
Out[12]:
In [13]:
# Report the sample count of `data` (the loaded dataset), displayed as this
# cell's output.
data.num_samples()
Out[13]:
In [ ]: