In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

Pandas kütüphanesi ile veri yükleme

  • Data frame'e veri aktaracağız

In [43]:
# Load the people dataset from a CSV file (the path is relative to the working directory).
df = pd.read_csv('people-example.csv')

In [44]:
df


Out[44]:
First Name Last Name Country age
0 Bob Smith United States 24
1 Alice Williams Canada 23
2 Malcolm Jone England 22
3 Felix Brown USA 23
4 Alex Cooper NaN 23
5 Tod Campbell United States 22
6 Derek Ward Switzerland 25
7 Leyla Doğan NaN 8
8 Nusret Barış Doğan Turkey 5
9 Efe Deniz Turkey 13
10 Çağla Karaali Turkey 39

In [45]:
# Look at the last rows
df.tail()


Out[45]:
First Name Last Name Country age
6 Derek Ward Switzerland 25
7 Leyla Doğan NaN 8
8 Nusret Barış Doğan Turkey 5
9 Efe Deniz Turkey 13
10 Çağla Karaali Turkey 39

In [46]:
print(df)


      First Name Last Name        Country  age
0            Bob     Smith  United States   24
1          Alice  Williams         Canada   23
2        Malcolm      Jone        England   22
3          Felix     Brown            USA   23
4           Alex    Cooper            NaN   23
5            Tod  Campbell  United States   22
6          Derek      Ward    Switzerland   25
7          Leyla     Doğan            NaN    8
8   Nusret Barış     Doğan         Turkey    5
9            Efe     Deniz         Turkey   13
10         Çağla   Karaali         Turkey   39

In [9]:
type(df)


Out[9]:
pandas.core.frame.DataFrame

In [10]:
# Preview only: the result is not assigned, so df itself still holds the NaN values.
df.fillna('Missing')


Out[10]:
First Name Last Name Country age
0 Bob Smith United States 24
1 Alice Williams Canada 23
2 Malcolm Jone England 22
3 Felix Brown USA 23
4 Alex Cooper Missing 23
5 Tod Campbell United States 22
6 Derek Ward Switzerland 25
7 Leyla Doğan Missing 8
8 Nusret Barış Doğan Turkey 5
9 Efe Deniz Turkey 13
10 Çağla Karaali Turkey 39

In [49]:
# Keep the filled frame by rebinding df; every missing value becomes the string 'Missing'.
df = df.fillna('Missing')

In [12]:
df


Out[12]:
First Name Last Name Country age
0 Bob Smith United States 24
1 Alice Williams Canada 23
2 Malcolm Jone England 22
3 Felix Brown USA 23
4 Alex Cooper Missing 23
5 Tod Campbell United States 22
6 Derek Ward Switzerland 25
7 Leyla Doğan Missing 8
8 Nusret Barış Doğan Turkey 5
9 Efe Deniz Turkey 13
10 Çağla Karaali Turkey 39

In [13]:
df.dtypes


Out[13]:
First Name    object
Last Name     object
Country       object
age            int64
dtype: object

In [14]:
# Show the first three rows.
df.head(3)


Out[14]:
First Name Last Name Country age
0 Bob Smith United States 24
1 Alice Williams Canada 23
2 Malcolm Jone England 22

In [17]:
# Show the first five rows.
df.head(5)


Out[17]:
First Name Last Name Country age
0 Bob Smith United States 24
1 Alice Williams Canada 23
2 Malcolm Jone England 22
3 Felix Brown USA 23
4 Alex Cooper Missing 23

In [23]:
# Double brackets select a one-column DataFrame rather than a Series.
ages = df[['age']]

In [24]:
type(ages)


Out[24]:
pandas.core.frame.DataFrame

In [25]:
ages.max()


Out[25]:
age    39
dtype: int64

In [26]:
ages.mean()


Out[26]:
age    20.636364
dtype: float64

In [27]:
ages.median()


Out[27]:
age    23.0
dtype: float64

In [31]:
# Histogram of the age column. The trailing semicolon suppresses the
# array-of-Axes repr so that only the figure appears as the cell output.
ages.hist();


Out[31]:
array([[<matplotlib.axes._subplots.AxesSubplot object at 0x112f42710>]], dtype=object)

In [32]:
# Square every age element-wise.
ages ** 2


Out[32]:
age
0 576
1 529
2 484
3 529
4 529
5 484
6 625
7 64
8 25
9 169
10 1521

In [33]:
df['Country']


Out[33]:
0     United States
1            Canada
2           England
3               USA
4           Missing
5     United States
6       Switzerland
7           Missing
8            Turkey
9            Turkey
10           Turkey
Name: Country, dtype: object

In [34]:
def change_country(ulke):
    """Return 'United States' for the alias 'USA'; return any other value unchanged."""
    return 'United States' if ulke == 'USA' else ulke

In [39]:
change_country('USA')


Out[39]:
'United States'

In [38]:
change_country('Türkiye')


Out[38]:
'Türkiye'

In [47]:
# Normalize country aliases by passing each value through change_country.
df['Country'] = df['Country'].map(change_country)

In [50]:
df


Out[50]:
First Name Last Name Country age
0 Bob Smith United States 24
1 Alice Williams Canada 23
2 Malcolm Jone England 22
3 Felix Brown United States 23
4 Alex Cooper Missing 23
5 Tod Campbell United States 22
6 Derek Ward Switzerland 25
7 Leyla Doğan Missing 8
8 Nusret Barış Doğan Turkey 5
9 Efe Deniz Turkey 13
10 Çağla Karaali Turkey 39

In [51]:
# Build a display name: first and last name joined by a single space, element-wise.
df['Full Name'] = df['First Name'] + ' ' + df['Last Name']

In [52]:
df


Out[52]:
First Name Last Name Country age Full Name
0 Bob Smith United States 24 Bob Smith
1 Alice Williams Canada 23 Alice Williams
2 Malcolm Jone England 22 Malcolm Jone
3 Felix Brown United States 23 Felix Brown
4 Alex Cooper Missing 23 Alex Cooper
5 Tod Campbell United States 22 Tod Campbell
6 Derek Ward Switzerland 25 Derek Ward
7 Leyla Doğan Missing 8 Leyla Doğan
8 Nusret Barış Doğan Turkey 5 Nusret Barış Doğan
9 Efe Deniz Turkey 13 Efe Deniz
10 Çağla Karaali Turkey 39 Çağla Karaali

In [55]:
df


Out[55]:
First Name Last Name Country age Full Name
0 Bob Smith United States 24 Bob Smith
1 Alice Williams Canada 23 Alice Williams
2 Malcolm Jone England 22 Malcolm Jone
3 Felix Brown United States 23 Felix Brown
4 Alex Cooper Missing 23 Alex Cooper
5 Tod Campbell United States 22 Tod Campbell
6 Derek Ward Switzerland 25 Derek Ward
7 Leyla Doğan Missing 8 Leyla Doğan
8 Nusret Barış Doğan Turkey 5 Nusret Barış Doğan
9 Efe Deniz Turkey 13 Efe Deniz
10 Çağla Karaali Turkey 39 Çağla Karaali

In [56]:
# Take an independent copy. Plain assignment would only create a second name
# for the same DataFrame, so in-place changes to df would also alter the backup.
backup = df.copy()

In [57]:
# Drop the age column by keyword. Passing the axis positionally (drop('age', 1))
# is rejected by pandas 2.x, where every argument after labels is keyword-only.
df = df.drop(columns='age')

In [58]:
df


Out[58]:
First Name Last Name Country Full Name
0 Bob Smith United States Bob Smith
1 Alice Williams Canada Alice Williams
2 Malcolm Jone England Malcolm Jone
3 Felix Brown United States Felix Brown
4 Alex Cooper Missing Alex Cooper
5 Tod Campbell United States Tod Campbell
6 Derek Ward Switzerland Derek Ward
7 Leyla Doğan Missing Leyla Doğan
8 Nusret Barış Doğan Turkey Nusret Barış Doğan
9 Efe Deniz Turkey Efe Deniz
10 Çağla Karaali Turkey Çağla Karaali

In [ ]: