notebook.community

Edit and run



In [2]:

    
import pandas as pd
import numpy as np
from IPython.display import display

# Small integer frame used by the sorting examples that follow.
# Column 'one' contains repeated values so that a secondary sort key matters.
df1 = pd.DataFrame(
    {
        'one': [2, 1, 1, 1],
        'two': [1, 3, 2, 4],
        'three': [5, 4, 3, 2],
    }
)
df1



In [2]:

    
# Rows ordered by ascending values of column 'two'; df1 itself is not modified.
df1.sort_values('two', ascending=True)



In [3]:

    
# Pick the three columns explicitly, then sort by 'one' with 'two' as tie-breaker.
df1.loc[:, ['one', 'two', 'three']].sort_values(['one', 'two'])



In [4]:

    
# Multi-key sort: primary key 'one', ties resolved by 'two', both ascending.
df1.sort_values(['one', 'two'], ascending=[True, True])



In [5]:

    
# 5x3 frame of standard-normal draws with labelled rows and columns.
df = pd.DataFrame(
    np.random.randn(5, 3),
    index=list('acefh'),
    columns=['one', 'two', 'three'],
)

# Show the frame before any values are blanked out.
display(df)

# NOTE: plain assignment binds a second name to the SAME object (no copy is
# made), so the write through df2 below also changes df.
df2 = df
df2.loc[['a', 'c', 'h'], ['one']] = np.nan

# df now carries NaN in column 'one' for rows a, c and h.
df



In [6]:

    
# Total of column 'one'; missing entries are skipped (the pandas default).
df['one'].sum(skipna=True)









    Out[6]:





2.1486985947566177



In [7]:

    
# Mean down the rows: one value per column.
df.mean(axis=0)









    Out[7]:





one      1.074349
two     -0.882074
three    0.332695
dtype: float64



In [8]:

    
# Mean across the columns: one value per row label.
df.mean(axis=1)









    Out[8]:





a    0.580118
c   -0.564279
e    0.366245
f   -0.255871
h   -0.480496
dtype: float64



In [9]:

    
# Show the input first, then the running total down each column.
display(df)
df.cumsum(axis=0)



In [10]:

    
# Show the input first, then the per-group mean keyed on the values of 'one'.
# NOTE(review): with pandas defaults, rows whose key is NaN are presumably
# dropped from the result - confirm against the rendered output.
display(df)
df.groupby(by='one').mean()



In [11]:

    
# Rebind df2 to a fresh random frame with the same row/column labels.
df2 = pd.DataFrame(
    np.random.randn(5, 3),
    index=list('acefh'),
    columns=['one', 'two', 'three'],
)

# Add one column each of string, boolean and datetime data.
df2['four'] = 'bar'
# The comparison reads from the earlier frame df, not from df2.
df2['five'] = df['one'] > 0
df2['timestamp'] = pd.Timestamp('20120101')

# Show the complete frame before introducing missing values.
display(df2)

# Blank out rows a, c and h in one numeric and one datetime column.
df2.loc[['a', 'c', 'h'], ['one', 'timestamp']] = np.nan
df2



In [12]:

    
# Replace every missing entry with the constant 0; returns a new frame.
df2.fillna(value=0)



In [13]:

    
# Forward-fill: propagate the last valid observation down each column.
# Leading gaps (no earlier valid value) stay missing.
# DataFrame.ffill() replaces fillna(method='pad'), whose `method` keyword is
# deprecated in recent pandas releases.
df2.ffill()



In [14]:

    
# Backward-fill: pull the next valid observation up each column.
# Trailing gaps (no later valid value) stay missing.
# DataFrame.bfill() replaces fillna(method='bfill'), whose `method` keyword is
# deprecated in recent pandas releases.
df2.bfill()



In [15]:

    
# Fill gaps with the per-column mean.
# df2 also holds a string column ('four') and a datetime column ('timestamp');
# numeric_only=True restricts the mean to numeric/boolean columns so the call
# does not fail on the string column under pandas >= 2.0. Columns without a
# computed mean (here 'timestamp') are left untouched and keep their NaT.
df2.fillna(df2.mean(numeric_only=True))



In [16]:

    
# Two float columns with interior gaps: one missing value in 'A', two
# consecutive missing values in 'B'.
df3 = pd.DataFrame(
    {
        'A': [1, 2.1, np.nan, 4.7, 5.6, 6.8],
        'B': [0.25, np.nan, np.nan, 4, 12.2, 14.4],
    }
)

# Linear interpolation (the default method) fills each gap from its neighbours.
df3.interpolate(method='linear')



In [7]:

    
# Keep only readings of at least 90; everything below becomes NaN.
sample = pd.DataFrame({'PR': [10, 100, 40]})
# where() keeps entries satisfying the condition, the complement of
# mask(PR < 90) for this NaN-free input.
sample['PR'] = sample['PR'].where(sample['PR'] >= 90, np.nan)
sample



In [6]:

    
# Same thresholding as a boolean-indexed assignment.
# The column is created as float64 up front: writing NaN into an int64 column
# relies on implicit upcasting during setitem, which recent pandas versions
# deprecate.
sample = pd.DataFrame({'PR': [10, 100, 40]}, dtype='float64')
# Blank out every reading below 90 in place.
sample.loc[sample['PR'] < 90, 'PR'] = np.nan
sample



In [ ]:

	one	two	three
a	-0.688905	1.559642	-0.399407
c	0.368577	-0.901106	-0.227452
e	1.183389	-1.842312	1.757657
f	0.965310	-1.736156	0.003234
h	2.954985	-1.490437	0.529445

	one	two	three
a	NaN	1.559642	-0.399407
c	NaN	-0.901106	-0.227452
e	1.183389	-1.842312	1.757657
f	0.965310	-1.736156	0.003234
h	NaN	-1.490437	0.529445

	one	two	three
a	NaN	1.559642	-0.399407
c	NaN	-0.901106	-0.227452
e	1.183389	-1.842312	1.757657
f	0.965310	-1.736156	0.003234
h	NaN	-1.490437	0.529445

	one	two	three
a	NaN	1.559642	-0.399407
c	NaN	0.658536	-0.626859
e	1.183389	-1.183776	1.130798
f	2.148699	-2.919932	1.134032
h	NaN	-4.410370	1.663477

	one	two	three
a	NaN	1.559642	-0.399407
c	NaN	-0.901106	-0.227452
e	1.183389	-1.842312	1.757657
f	0.965310	-1.736156	0.003234
h	NaN	-1.490437	0.529445

	one	two	three	four	five	timestamp
a	-1.001734	-0.519590	-0.363891	bar	False	2012-01-01
c	-1.179448	-0.409359	1.697587	bar	False	2012-01-01
e	0.762478	-1.229147	0.826560	bar	True	2012-01-01
f	0.367050	-0.346026	-0.531973	bar	True	2012-01-01
h	0.675752	-0.251475	-0.275303	bar	False	2012-01-01

	one	two	three	four	five	timestamp
a	0.000000	-0.519590	-0.363891	bar	False	1970-01-01
c	0.000000	-0.409359	1.697587	bar	False	1970-01-01
e	0.762478	-1.229147	0.826560	bar	True	2012-01-01
f	0.367050	-0.346026	-0.531973	bar	True	2012-01-01
h	0.000000	-0.251475	-0.275303	bar	False	1970-01-01

	one	two	three	four	five	timestamp
a	0.564764	-0.519590	-0.363891	bar	False	NaT
c	0.564764	-0.409359	1.697587	bar	False	NaT
e	0.762478	-1.229147	0.826560	bar	True	2012-01-01
f	0.367050	-0.346026	-0.531973	bar	True	2012-01-01
h	0.564764	-0.251475	-0.275303	bar	False	NaT