In [3]:
# Standard-library and third-party imports, one per line.
import os

import numpy as np
import pandas as pd

# Project imports: path helper, simulation models, and the dataset wrapper.
from synthicity.utils import misc
from drcog.models import (
    dataset,
    elcm_simulation,
    hlcm_simulation,
    regression_model_simulation,
)

# Build the dataset wrapper around drcog.h5 located under misc.data_dir().
dset = dataset.DRCOGDataset(os.path.join(misc.data_dir(), 'drcog.h5'))
# Keep a handle on the parcels table; every later cell works on this name.
parcels = dset.parcels


Fetching parcels
Fetching modify_table

In [6]:
# Display the parcels table as read through the dataset's `store` attribute.
dset.store.parcels


Out[6]:
<class 'pandas.core.frame.DataFrame'>
Int64Index: 949484 entries, 1 to 1128935
Data columns (total 23 columns):
county_id                949484  non-null values
parcel_sqft              949484  non-null values
land_value               949484  non-null values
zone_id                  949484  non-null values
city_id                  949484  non-null values
gen_lu_type_id           949484  non-null values
lu_type_id               949484  non-null values
tax_exempt_flag          949484  non-null values
school_district          949484  non-null values
zoning_id                949484  non-null values
dist_bus                 949484  non-null values
dist_rail                949484  non-null values
in_ugb                   949484  non-null values
in_uga                   949484  non-null values
env_constr_park          949484  non-null values
env_constr_lake          949484  non-null values
env_constr_floodplain    949484  non-null values
env_constr_river         949484  non-null values
env_constr_landslide     949484  non-null values
far_id                   949484  non-null values
prop_constrained         949484  non-null values
centroid_x               949484  non-null values
centroid_y               949484  non-null values
dtypes: float32(7), int32(14), int64(2)

In [3]:
# Show the directory that the drcog.h5 path is resolved against.
misc.data_dir()


Out[3]:
'c:\\urbansim\\data'

In [1]:
# List the column labels of `parcels`.
# NOTE: `parcels` is assigned in the setup cell; the recorded NameError
# (execution count 1) comes from running this cell before that one.
parcels.columns


---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
<ipython-input-1-e098aa358884> in <module>()
----> 1 parcels.columns

NameError: name 'parcels' is not defined

In [4]:


In [5]:
# Rebind `parcels` to a copy ordered by its index (parcel_id, per the
# displayed outputs).
parcels = parcels.sort_index()

In [6]:
import os

import psycopg2
import pandas.io.sql as sql

# The database password must not live in the notebook: it is read from the
# DRCOG_DB_PASSWORD environment variable (KeyError if it is not set).
# NOTE(review): the password that used to be hardcoded here has been exposed
# in the notebook history and should be rotated.
db_password = os.environ['DRCOG_DB_PASSWORD']

# Inside a single-quoted libpq DSN value, backslashes and single quotes have
# to be backslash-escaped.
escaped_password = db_password.replace('\\', '\\\\').replace("'", "\\'")
conn_string = ("host='paris.urbansim.org' port=5433 dbname='denver' "
               "user='drcog' password='%s'" % escaped_password)

conn = psycopg2.connect(conn_string)
# Cursor is kept for parity with the original cell; the query below goes
# through the connection object directly.
cur = conn.cursor()

# Pull the reference size and centroid columns for every parcel.
parcels_ref = sql.read_frame('select parcel_id, parcel_sqft,centroid_x,centroid_y from parcels_for_reference',conn)

In [7]:
# Key the reference table by parcel_id and order it by that key in one
# chained step.
parcels_ref = parcels_ref.set_index('parcel_id').sort_index()

In [8]:
# Show the last rows of the reference table.
parcels_ref.tail()


Out[8]:
parcel_sqft centroid_x centroid_y
parcel_id
1128930 57444 3253951 1557284
1128932 108764 3260487 1568146
1128933 38235 3260421 1568760
1128934 113718 3260292 1565251
1128935 24011 3256371 1569931

In [9]:
# Show the last rows of `parcels`, restricted to the parcel_sqft column.
parcels[['parcel_sqft']].tail()


Out[9]:
parcel_sqft
parcel_id
1128930 0
1128932 1636528
1128933 3187557
1128934 113718
1128935 1707626

In [10]:
# Replace both centroid columns with the reference values; pandas aligns the
# assigned Series on the index of `parcels`.
# NOTE(review): the recorded outputs show parcel_sqft also differing from the
# reference (e.g. parcel_id 4 and 1128930), yet only the centroids are copied
# here - confirm that is intended.
parcels['centroid_x'] = parcels_ref['centroid_x']
parcels['centroid_y'] = parcels_ref['centroid_y']

In [11]:
# Show the first rows of `parcels` for the size and centroid columns, after
# the centroid columns were reassigned.
parcels[['parcel_sqft','centroid_x','centroid_y']].head()


Out[11]:
parcel_sqft centroid_x centroid_y
parcel_id
1 20479 3174135 1695429
2 17777 3180889 1695592
3 59025 3175519 1699844
4 1640178 3192128 1747750
5 0 3154372 1747898

In [12]:
# Show the first rows of the reference table.
parcels_ref.head()


Out[12]:
parcel_sqft centroid_x centroid_y
parcel_id
1 20479 3174135 1695429
2 17777 3180889 1695592
3 59025 3175519 1699844
4 285497 3192128 1747750
5 27156 3154372 1747898

In [13]:
# Open the HDF5 file the dataset was built from, resolving the path through
# misc.data_dir() (as the setup cell does) rather than a hardcoded absolute
# Windows path.
# NOTE(review): dset.store may still have this file open - confirm that a
# second handle is safe before writing.
store = pd.HDFStore(os.path.join(misc.data_dir(), 'drcog.h5'))

In [14]:
# Store the updated `parcels` frame under the 'parcels' key of the HDF5 store.
store['parcels'] = parcels

In [15]:
# Close the store handle opened above once the write is done.
store.close()