In [1]:
# Build joined_unfeaturized_mini.csv from joined_unfeaturized.csv.
# This cell loads the full table; the cells below down-sample it and save it.
import pandas as pd

DATA_PATH = "joined_unfeaturized.csv"

# A bare '-' in the file is read as a missing value.
full_df = pd.read_csv(DATA_PATH, na_values=['-'])

# Keep every non-null cell as it is and substitute None where a value is missing.
is_present = full_df.notnull()
full_df = full_df.where(is_present, None)

full_df.head(1)
Out[1]:
In [21]:
# Down-sample: keep every SAMPLE_EVERY-th row of full_df by position
# (rows 0, 10, 20, ...), preserving the original index labels.
#
# A positional slice replaces the hand-built boolean mask because it:
#   * avoids `xrange`, which exists only in Python 2;
#   * needs no per-row Python loop;
#   * selects by position, so it does not rely on full_df having a default
#     0..n-1 index for the mask to line up with.
SAMPLE_EVERY = 10
mini_df = full_df.iloc[::SAMPLE_EVERY]
mini_df.head(3)
Out[21]:
In [22]:
# Save the down-sampled frame (mini_df) as the "mini" CSV.
# index_label=False is passed to to_csv as-is; per the pandas docs it omits the
# header field for the index column (the index values themselves are still written).
MINI_CSV_PATH = 'joined_unfeaturized_mini.csv'
mini_df.to_csv(MINI_CSV_PATH, index_label=False)