In [1]:
import numpy as np
import pandas as pd
from pandas import DataFrame,Series
In [2]:
# Small demo frame that deliberately contains repeated rows:
# rows 0/1 are identical ('A', 2) and rows 3/4 are identical ('B', 3).
df = DataFrame({
    'key1': ['A', 'A', 'B', 'B', 'B'],
    'key2': [2, 2, 2, 3, 3],
})
df
Out[2]:
In [3]:
# Boolean mask: True for every row that repeats an earlier row
# (keep='first' is the default, written out here for clarity).
df.duplicated(keep='first')
Out[3]:
In [5]:
# Drop rows that are exact repeats across all columns, retaining the
# first occurrence of each (the default behaviour, spelled out explicitly).
df.drop_duplicates(keep='first')
Out[5]:
In [7]:
# De-duplicate on 'key1' only; for each distinct key the first row
# encountered is the one that survives.
df.drop_duplicates(subset=['key1'], keep='first')
Out[7]:
In [8]:
# De-duplicate on 'key1', keeping the last row found for each key.
# The old `take_last=True` flag was deprecated in favour of `keep='last'`
# and later removed from pandas, so it now raises TypeError; use `keep`.
df.drop_duplicates(['key1'], keep='last')
Out[8]:
In [9]:
# De-duplicate on 'key1' only, retaining the final row seen for each key.
df.drop_duplicates(subset=['key1'], keep='last')
Out[9]:
In [ ]: