Run this notebook to make sure that the make_clean_data functions are working properly. Warning: some of them may take a while to run (particularly the functions that go through the whole edgelist).


In [1]:
import sys

sys.path.append('../../code/')
import os
import json
from datetime import datetime
import time

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import scipy.stats as stats

import networkx as nx

# Load IPython's autoreload extension and set mode 2 so that edits to imported
# modules are picked up without restarting the kernel.
%load_ext autoreload
%autoreload 2
# Render matplotlib figures inline in the notebook output.
%matplotlib inline

# Data directory, relative to this notebook's working directory; it is the
# first argument passed to every make_clean_* / make_* call in the cells below.
data_dir = '../../data/'

In [ ]:
# Import the pipeline entry points explicitly rather than with a wildcard, so
# it is clear where each function comes from and nothing in make_clean_data can
# silently shadow names imported earlier in the notebook (time, os, np, ...).
# The module is resolved through the '../../code/' entry added to sys.path.
from make_clean_data import (
    make_clean_case_metadata,
    make_clean_edgelist,
    make_clean_jurisdiction_file,
    make_jurisdiction_edgelist,
)

In [5]:
# Run the case-metadata step of the pipeline against data_dir.
# NOTE(review): the files this reads and writes are determined inside
# make_clean_data and are not visible from this notebook -- confirm there.
make_clean_case_metadata(data_dir)

In [ ]:
# Time the edgelist step using wall-clock timestamps taken before and after
# the call. overwrite=True is passed through to make_clean_edgelist
# (presumably forcing existing output to be regenerated -- confirm in
# make_clean_data).
start = time.time()
make_clean_edgelist(data_dir, overwrite=True)
end = time.time()
# Parenthesized single-argument print produces the same output on Python 2
# and Python 3; the bare print statement is a SyntaxError on Python 3.
print('took %d seconds' % (end - start))

In [21]:
# Run the jurisdiction-file step of the pipeline against data_dir.
# NOTE(review): the files this reads and writes are determined inside
# make_clean_data and are not visible from this notebook -- confirm there.
make_clean_jurisdiction_file(data_dir)

In [6]:
# Run the jurisdiction-edgelist step of the pipeline against data_dir.
# NOTE(review): presumably depends on outputs of the earlier cleaning steps;
# the actual inputs/outputs are defined in make_clean_data -- confirm there.
make_jurisdiction_edgelist(data_dir)

In [22]:


In [21]:


In [ ]: