In [1]:
import csv
import pandas as pd
import numpy as np
import src.Paths as path
import sys
import os
# Report where the kernel is running from and which interpreter it uses,
# one value per line, so relative paths further down can be sanity-checked.
for runtime_fact in (os.getcwd(), sys.version_info):
    print(runtime_fact)
In [2]:
# Display the `trajectories_training_file` attribute of the project module
# `src.Paths` (imported as `path`) as this cell's output.
# NOTE(review): presumably the location of the trajectories training CSV --
# confirm against src/Paths.py.
path.trajectories_training_file
Out[2]:
In [3]:
# Base names of the CSV tables read by this notebook.
links_file = "links (table 3).csv"
routes_file = "routes (table 4).csv"
trajectories_file = "trajectories(table 5)_training.csv"
volume_file = "volume(table 6)_training.csv"
weather_file = "weather (table 7)_training.csv"

# Routes, links, weather and volume are read from the "dataset" folder.
training_files = "../../dataset/training/"
routes_df = pd.read_csv(os.path.join(training_files, routes_file))
links_df = pd.read_csv(os.path.join(training_files, links_file))
weather_df = pd.read_csv(os.path.join(training_files, weather_file))
volume_df = pd.read_csv(os.path.join(training_files, volume_file))

# The trajectories table is read from the "new_dataset" folder instead.
# `training_files` is deliberately rebound here, so once this cell has run it
# points at the new_dataset directory, not the one used for the reads above.
training_files = "../../new_dataset/training/"
trajectories_df = pd.read_csv(os.path.join(training_files, trajectories_file))
In [3]:
# Render the whole routes table (read from `routes_file` via pd.read_csv)
# as this cell's output.
routes_df
Out[3]:
In [4]:
# Select the rows of `df` whose index label repeats an earlier one
# (Index.duplicated() flags every occurrence after the first by default).
# NOTE(review): `df` is not assigned in any of the cells visible above, so
# this raises NameError on a fresh kernel unless it is defined elsewhere --
# confirm which of the loaded frames was meant.
df[df.index.duplicated()]
Out[4]: