In [1]:
import os
import settings
import pandas as pd

All filings


In [2]:
# Load filings.csv from the configured data directory into a DataFrame.
filings = pd.read_csv(
    filepath_or_buffer=os.path.join(settings.data_dir, "filings.csv"),
)

In [3]:
# Read the entire table through the connection defined in settings.
# The resulting frame is reused by every merge later in this notebook.
sched_d = pd.read_sql_table(
    table_name="calaccess_processed_form460scheduleditem",
    con=settings.db_connection,
)

In [6]:
# Inner join: keep only the row pairs where the filings'
# `calaccess_filing_id` equals the table's `filing_id`.
d_items = filings.merge(
    sched_d,
    how="inner",
    left_on="calaccess_filing_id",
    right_on="filing_id",
)

In [7]:
# Save the merged rows to transfers.csv in the data directory,
# leaving out the DataFrame index column.
d_items.to_csv(
    path_or_buf=os.path.join(settings.data_dir, 'transfers.csv'),
    index=False,
)

2016 filings


In [8]:
# Load filings-2016.csv from the configured data directory into a DataFrame.
recent_filings = pd.read_csv(
    filepath_or_buffer=os.path.join(settings.data_dir, "filings-2016.csv"),
)

In [11]:
# Inner join against the already-loaded `sched_d` frame: keep only the
# row pairs where `calaccess_filing_id` equals the table's `filing_id`.
recent_d_items = recent_filings.merge(
    sched_d,
    how="inner",
    left_on="calaccess_filing_id",
    right_on="filing_id",
)

In [12]:
# Save the merged rows to transfers-2016.csv in the data directory,
# leaving out the DataFrame index column.
recent_d_items.to_csv(
    path_or_buf=os.path.join(settings.data_dir, 'transfers-2016.csv'),
    index=False,
)