In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split
In [2]:
# Load the CSV and shuffle its rows in one chained expression.
filename = 'clustering/dataset.csv'
dataset = (
    pd.read_csv(filename)
    # frac=1 draws every row, i.e. a full shuffle; the fixed seed keeps the order repeatable.
    .sample(frac=1, random_state=32)
    # No drop=True here: the pre-shuffle row labels are kept as an 'index' column.
    .reset_index()
)
dataset.head()
Out[2]:
In [3]:
# Remove the 'index' column (the pre-shuffle row labels that reset_index()
# stored as a column) and the 'y' column.
# Rebinding `dataset` instead of mutating with inplace=True, together with
# errors='ignore', makes this cell safe to re-run: a second execution is a
# no-op rather than a KeyError on the already-removed columns.
dataset = dataset.drop(columns=['index', 'y'], errors='ignore')
dataset.head()
Out[3]:
In [4]:
# Save the current frame as a CSV file; index=False keeps the row labels out of the output.
dataset.to_csv(path_or_buf='clustering/synth_all.csv', index=False)