In [132]:
import csv
import pandas as pd
import numpy as np
import src.Paths as path
import sys
import os
# Environment check: print the current working directory (the relative
# "../../..." data paths used when loading the CSV files resolve against it)
# and the version of the Python interpreter running this kernel.
print(os.getcwd())
print(sys.version_info)
In [133]:
# Display the value of `trajectories_training_file` from the project's
# src.Paths module (imported as `path`).
# NOTE(review): presumably the path of the trajectories training CSV; the
# loading cell builds its paths from hard-coded strings rather than from this
# value -- confirm which one is authoritative.
path.trajectories_training_file
Out[133]:
In [134]:
# File names of the raw tables, exactly as they are spelled on disk.
links_file = "links (table 3).csv"
routes_file = "routes (table 4).csv"
trajectories_file = "trajectories(table 5)_training.csv"
volume_file = "volume(table 6)_training.csv"
weather_file = "weather (table 7)_training.csv"

# Routes, links, weather and volume are read (in that order) from the
# original dataset directory.
training_files = "../../dataset/training/"
routes_df, links_df, weather_df, volume_df = (
    pd.read_csv(os.path.join(training_files, table_name))
    for table_name in (routes_file, links_file, weather_file, volume_file)
)

# The trajectories table is read from the "new_dataset" directory instead.
# `training_files` is intentionally left pointing at that directory once the
# cell finishes, so any later cell reading it sees the same value as before.
training_files = "../../new_dataset/training/"
trajectories_df = pd.read_csv(os.path.join(training_files, trajectories_file))
In [135]:
# Display the routes table loaded from "routes (table 4).csv" for a quick
# visual inspection. This renders the whole frame; switch to
# `routes_df.head()` if the table turns out to be large.
routes_df
Out[135]:
In [136]:
# `time` is not used in this cell; the import is kept so the name stays bound
# for any later cell that may rely on it.
from datetime import time

# Build `df3` from the trajectories table:
#   1. index the rows by (intersection_id, tollgate_id, vehicle_id);
#   2. parse `starting_time` into datetimes;
#   3. keep rows whose `starting_time` falls on a Tuesday (pandas numbers
#      weekdays from Monday == 0, so dayofweek == 1 is Tuesday);
#   4. keep rows whose `starting_time` has hour 14 and minute 49 or 50
#      (`between` is inclusive at both ends), i.e. 14:49:00 through 14:50:59.
# `trajectories_df` itself is left untouched: every step returns a new frame.
df3 = (
    trajectories_df
    .set_index(['intersection_id', 'tollgate_id', 'vehicle_id'])
    .assign(starting_time=lambda frame: pd.to_datetime(frame['starting_time']))
    .loc[lambda frame: frame['starting_time'].dt.dayofweek == 1]
    .loc[lambda frame: (frame['starting_time'].dt.hour == 14)
         & frame['starting_time'].dt.minute.between(49, 50)]
)

# Report how many rows matched, then show them as the cell's output.
print(len(df3))
df3
Out[136]: