In [2]:
train = pd.read_csv('train.csv')
test = pd.read_csv('test.csv')
sample = pd.read_csv('sampleSubmission.csv')
In [7]:
train.head(2)
Out[7]:
In [8]:
test.head(2)
Out[8]:
In [6]:
sample.head(2)
Out[6]:
In [5]:
gps = pd.read_csv('metaData_taxistandsID_name_GPSlocation.csv')
In [10]:
print gps[:5]
In [4]:
import pandas as pd
In [11]:
# 머신러닝을 쓰지말고 가까운데만 계산해서 제출해보자
test = pd.read_csv('test.csv')
gps = pd.read_csv('metaData_taxistandsID_name_GPSlocation.csv')
In [15]:
tmp = test.POLYLINE[0]
print eval(tmp)
print eval(tmp)[-1]
In [22]:
test = pd.read_csv('test.csv', usecols=['POLYLINE','TRIP_ID'],
converters={'POLYLINE': lambda x: eval(x)[-1]})
In [19]:
print test.head(2)
print test.POLYLINE[0][0]
In [23]:
test['LONGITUDE'] = test.POLYLINE.apply(lambda x: x[0])
test['LATITUDE'] = test.POLYLINE.apply(lambda x: x[1])
# Create your submission file
submission = pd.DataFrame({"TRIP_ID": test['TRIP_ID'], "LONGITUDE" : test['LONGITUDE'], "LATITUDE" : test['LATITUDE']})
submission.to_csv("submission.csv", index=False)
In [25]:
# kaggle LB
# 3.31766 211/326
In [27]:
pwd
Out[27]: