In [1]:
import pandas as pd
In [2]:
# Sample frame: one column 's' of comma-separated strings, labelled 'a'..'d'.
df = pd.DataFrame(
    data={'s': ['X,Y,Z', 'X', 'XY,Y', 'Y,Z,XY']},
    index=list('abcd'),
)
In [3]:
# Show the starting frame (plain-text repr) before any list column is added.
print(df)
In [4]:
# Derive column 'l': each comma-separated string in 's' becomes a Python list
# of its tokens. The original string column is left untouched.
df['l'] = df['s'].str.split(pat=',')
print(df)
In [5]:
# Report the dtype pandas assigned to each column of the frame.
print(df.dtypes)
In [6]:
# Inspect the Python type of the value stored at row 'a' of column 's'.
value_s = df.at['a', 's']
print(type(value_s))
In [7]:
# Inspect the Python type of the value stored at row 'a' of column 'l'.
value_l = df.at['a', 'l']
print(type(value_l))
In [8]:
# Alternative to .str.split: split each string on ',' and strip surrounding
# whitespace from every token, producing one list per row.
print(df['s'].apply(lambda text: list(map(str.strip, text.split(',')))))
In [9]:
# Number of tokens in each row's list.
print(df['l'].apply(lambda tokens: len(tokens)))
In [10]:
# Sorted copy of each row's list; sorted() returns a new list, so the lists
# stored in df are not reordered.
print(df['l'].apply(lambda tokens: sorted(tokens)))
In [11]:
# Re-join each list into a single comma-separated string (explicit-call form).
print(df['l'].apply(lambda tokens: str.join(',', tokens)))
In [12]:
# Same join as the lambda form, passing the separator's bound join method
# directly as the function to apply.
comma = ','
print(df['l'].apply(comma.join))
In [13]:
# Sort each list, then join the sorted tokens with ',' — done as two chained
# element-wise steps instead of one nested lambda.
print(df['l'].apply(sorted).apply(','.join))
In [14]:
# Append 'A' to every list in column 'l'.
#
# Build a new list per row and assign the column back, rather than calling
# list.append inside apply. list.append mutates the stored list objects in
# place and returns None, so using it in apply relies purely on a side effect:
# the resulting Series of None is discarded, and any other object that shares
# those list instances would be changed silently as well.
df['l'] = df['l'].apply(lambda tokens: tokens + ['A'])
print(df)
In [15]:
# Drop 'Z' from every list in column 'l'.
#
# A filtering comprehension builds a fresh list per row and the result is
# assigned back explicitly. This avoids mutating the stored lists in place via
# list.remove inside apply, whose lambda returned None on one branch and the
# list on the other. Rows without 'Z' come through with the same contents.
# Note: this removes every 'Z' in a row, not just the first; for the sample
# data each row holds at most one 'Z', so the printed frame is the same.
df['l'] = df['l'].apply(lambda tokens: [tok for tok in tokens if tok != 'Z'])
print(df)
In [16]:
# Boolean mask: True where the row's list has an element equal to 'X'.
# This is exact element membership, so a list holding only 'XY' does not match.
contains_x = df['l'].apply(lambda tokens: 'X' in tokens)
print(contains_x)
In [17]:
# Keep only the rows whose list in 'l' has an element equal to 'X'.
rows_with_x = df['l'].apply(lambda tokens: 'X' in tokens)
print(df.loc[rows_with_x])
In [18]:
# Boolean mask on the raw string column: True where 'Z' occurs anywhere in the
# string. This is a substring test on 's', not element membership on 'l'.
# 'Z' has no regex metacharacters, so a literal search gives the same mask.
print(df['s'].str.contains('Z', regex=False))
In [19]:
# Keep only the rows whose raw string in 's' contains the substring 'Z'.
z_mask = df['s'].str.contains('Z')
print(df.loc[z_mask])