In [1]:
import pandas as pd
In [2]:
# Read the three input CSVs (in this order) into df1, df2 and df3.
df1, df2, df3 = (
    pd.read_csv(csv_path)
    for csv_path in (
        '../resource/raw_df1.csv',
        '../resource/raw_df2.csv',
        '../resource/lee_df.csv',
    )
)
In [3]:
# Peek at the last row of df1 to confirm the file loaded through to the end.
df1.tail(n=1)
Out[3]:
In [4]:
# Peek at the last row of df2 to confirm the file loaded through to the end.
df2.tail(n=1)
Out[4]:
In [5]:
# Peek at the last row of df3 to confirm the file loaded through to the end.
df3.tail(n=1)
Out[5]:
1. 이동진 평점 및 코멘트만 불러오기 (new_df3)
In [6]:
# Boolean mask over df3 rows: True where the 'name' column equals the
# critic label below, False elsewhere.
lee = df3['name'].eq('이동진 평론가')
lee
Out[6]:
In [7]:
# Keep only the df3 rows flagged by the `lee` boolean mask.
lee_df = df3.loc[lee]
In [8]:
# Put the full df3 table and the mask-filtered subset side by side, then
# drop the first four columns by position.
#
# `.ix` was deprecated in pandas 0.20 and removed in pandas 1.0, so it is
# replaced with `.iloc`. This assumes the CSV headers are string labels, in
# which case `.ix` was already interpreting the integer slice positionally.
#
# NOTE(review): an axis=1 concat aligns rows on the index, so df3 rows that
# are missing from lee_df should end up with NaN in the lee_df-derived
# columns - confirm this is the intended result.
new_df3 = pd.concat([df3, lee_df], axis=1).iloc[:, 4:]
new_df3
Out[8]:
In [9]:
# Show pandas' default summary statistics for new_df3 as a quick sanity check.
new_df3.describe()
Out[9]:
In [10]:
# Assemble the combined table by placing positional column slices of df1,
# df2 and new_df3 side by side (axis=1 concat aligns rows on the index).
#
# `.ix` was deprecated in pandas 0.20 and removed in pandas 1.0, so every
# slice now uses `.iloc`. This assumes the column labels are strings, in
# which case `.ix` was already treating these integer slices as positions.
preprocess_df1 = pd.concat(
    [
        df1.iloc[:, :3],      # df1: first three columns
        new_df3.iloc[:, :1],  # new_df3: first column
        df2.iloc[:, 3:6],     # df2: columns at positions 3-5
        df2.iloc[:, 1:3],     # df2: columns at positions 1-2
        df1.iloc[:, 4:],      # df1: position 4 onward (position 3 is left out)
        df2.iloc[:, 6:],      # df2: position 6 onward (position 0 is left out)
        new_df3.iloc[:, 1:],  # new_df3: everything after its first column
    ],
    axis=1,
)
In [11]:
# Peek at the last row of the assembled table.
preprocess_df1.tail(n=1)
Out[11]:
In [12]:
# Write the assembled table to disk as CSV, omitting the row index.
preprocess_df1.to_csv(
    '../resource/preprocess_df1.csv',
    encoding='utf8',
    index=False,
)