In [1]:
csvfile = "GENdata.csv"

In [2]:
csvfile


Out[2]:
'GENdata.csv'

In [7]:
gendata = open(csvfile, 'r')

In [8]:
gendata


Out[8]:
<_io.TextIOWrapper name='GENdata.csv' mode='r' encoding='UTF-8'>

In [9]:
memdata = gendata.read()

In [10]:
memdata


Out[10]:
'PatientID,GeneticMarker,TestGroup\n1234,sep13,A\n2345,oct14,B\n98754,nov12,A\n323424,mar02,B\n'

In [15]:
print(memdata)


PatientID,GeneticMarker,TestGroup
1234,sep13,A
2345,oct14,B
98754,nov12,A
323424,mar02,B


In [16]:
import pandas as pd

In [21]:
csvdf = pd.read_csv(csvfile)

In [22]:
csvdf


Out[22]:
PatientID GeneticMarker TestGroup
0 1234 sep13 A
1 2345 oct14 B
2 98754 nov12 A
3 323424 mar02 B

In [25]:
csvdf.TestGroup.astype('category')


Out[25]:
0    A
1    B
2    A
3    B
Name: TestGroup, dtype: category
Categories (2, object): [A, B]

In [31]:
csvdf.describe


Out[31]:
<bound method NDFrame.describe of    PatientID GeneticMarker TestGroup
0       1234         sep13         A
1       2345         oct14         B
2      98754         nov12         A
3     323424         mar02         B>

In [ ]: