In [1]:
import pandas as pd
import datetime
import numpy as np

Loading Production Data from 1987 to 2008

The production data from these years follows the same file format.

We can therefore import using the same format and put the dataframes into a dictionary.

In 1990 we manually fix well API No: 21451, DUCKETT "A" and set it's well number to 1 as unspecified. Same in 1991.


In [2]:
dates_cols_oil = ["OIL."+str(i) for i in range(0, 12, 1)]
dates_cols_gas = ["GAS."+str(i)  for i in range(0, 12, 1)]
dates_cols = dates_cols_oil + dates_cols_gas
headers_old_2003 = ['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME','WELL_NO', '  OPER_NO', 'OPER_SUFFIX',
       'OPERATOR', 'ME', 'SECTION', 'TWP','RAN', 'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
           'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE','FORMATION', 'OFB', 'ALLOWABLE_CLASS',
       'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1',
       'YEAR', 'JAN', 'OIL.0', 'GAS.0', 'FEB',
       'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2',
       'APR', 'OIL.3', 'GAS.3', 'MAY', 'OIL.4',
       'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7',
       'SEP', 'OIL.8', 'GAS.8', 'OCT', 'OIL.9',
       'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC',
       'OIL.11', 'GAS.11']
headers_new_2004 = ['API_COUNTY', 'API_NUMBER', 'S', 'WELL_NAME','WELL_NO', '  OPER_NO',
       'OPERATOR', 'ME', 'SECTION', 'TWP','RAN', 'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
           'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE','FORMATION','ALLOWABLE_CLASS',
       'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'OFB.1',
       'YEAR', 'JAN', 'OIL.0', 'GAS.0', 'FEB',
       'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2',
       'APR', 'OIL.3', 'GAS.3', 'MAY', 'OIL.4',
       'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7',
       'SEP', 'OIL.8', 'GAS.8', 'OCT', 'OIL.9',
       'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC',
       'OIL.11', 'GAS.11']
df_in = None
production_data = {}
for i in range(1987, 2016, 1):
    dates_oil = [ "OIL_"+str(datetime.date(i, j+1, 1)) for j in range(0, 12, 1)]
    dates_gas = [ "GAS_"+str(datetime.date(i, j+1, 1)) for j in range(0, 12, 1)]
    renamed_oil = {old: new for old, new in zip(dates_cols_oil, dates_oil)}
    renamed_gas = {old: new for old, new in zip(dates_cols_gas, dates_gas)}
    renamed_cols = {**renamed_oil, **renamed_gas}
    #print(renamed_cols)
    if i != 1994: #No Data from 1994
        print(i)
        if i <= 2008:
            df = None
            if i < 2004:
                df = pd.read_csv("../raw/"+str(i)+"prodn.txt", delimiter="|", skiprows=[0, 2], names=headers_old_2003)
            else:
                df = pd.read_csv("../raw/"+str(i)+"prodn.txt", delimiter="|", skiprows=[0, 2], names=headers_new_2004)
            df_in = df.copy()
            print(df.columns)
            print(renamed_cols)
            df.rename(index=str, columns=renamed_cols, inplace=True)
            df = df.drop(['YEAR','JAN', 'FEB', 'MAR', 'APR', 'MAY', 'JUN', 'JUL','AUG', 'SEP', 'OCT', 'NOV', 'DEC'], axis=1)
            production_data[i] = df
        else:
            df = pd.read_csv("../raw/"+str(i)+"prodn.txt", delimiter="|")
            df[["API_COUNTY", "API_NUMBER"]].apply(lambda x: pd.to_numeric(x, errors='coerce',downcast='integer'))
            df_in = df.copy()
            df.rename(renamed_cols)
            production_data[i] = df
df_in.head()


1987
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1987-04-01', 'GAS.11': 'GAS_1987-12-01', 'OIL.6': 'OIL_1987-07-01', 'GAS.8': 'GAS_1987-09-01', 'OIL.8': 'OIL_1987-09-01', 'GAS.7': 'GAS_1987-08-01', 'GAS.2': 'GAS_1987-03-01', 'GAS.1': 'GAS_1987-02-01', 'OIL.0': 'OIL_1987-01-01', 'GAS.5': 'GAS_1987-06-01', 'OIL.2': 'OIL_1987-03-01', 'OIL.5': 'OIL_1987-06-01', 'OIL.11': 'OIL_1987-12-01', 'GAS.0': 'GAS_1987-01-01', 'OIL.4': 'OIL_1987-05-01', 'GAS.4': 'GAS_1987-05-01', 'GAS.9': 'GAS_1987-10-01', 'GAS.6': 'GAS_1987-07-01', 'OIL.3': 'OIL_1987-04-01', 'OIL.7': 'OIL_1987-08-01', 'OIL.1': 'OIL_1987-02-01', 'GAS.10': 'GAS_1987-11-01', 'OIL.10': 'OIL_1987-11-01', 'OIL.9': 'OIL_1987-10-01'}
1988
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1988-04-01', 'GAS.11': 'GAS_1988-12-01', 'OIL.6': 'OIL_1988-07-01', 'GAS.8': 'GAS_1988-09-01', 'OIL.8': 'OIL_1988-09-01', 'GAS.7': 'GAS_1988-08-01', 'GAS.2': 'GAS_1988-03-01', 'GAS.1': 'GAS_1988-02-01', 'OIL.0': 'OIL_1988-01-01', 'GAS.5': 'GAS_1988-06-01', 'OIL.2': 'OIL_1988-03-01', 'OIL.5': 'OIL_1988-06-01', 'OIL.11': 'OIL_1988-12-01', 'GAS.0': 'GAS_1988-01-01', 'OIL.4': 'OIL_1988-05-01', 'GAS.4': 'GAS_1988-05-01', 'GAS.9': 'GAS_1988-10-01', 'GAS.6': 'GAS_1988-07-01', 'OIL.3': 'OIL_1988-04-01', 'OIL.7': 'OIL_1988-08-01', 'OIL.1': 'OIL_1988-02-01', 'GAS.10': 'GAS_1988-11-01', 'OIL.10': 'OIL_1988-11-01', 'OIL.9': 'OIL_1988-10-01'}
1989
E:\Anaconda3\lib\site-packages\IPython\core\interactiveshell.py:2717: DtypeWarning: Columns (0,1,5,6,9,16,17,18,19,20,21,28,30,32,33,36,39,42,45,48,51,54,57,60,63,66) have mixed types. Specify dtype option on import or set low_memory=False.
  interactivity=interactivity, compiler=compiler, result=result)
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1989-04-01', 'GAS.11': 'GAS_1989-12-01', 'OIL.6': 'OIL_1989-07-01', 'GAS.8': 'GAS_1989-09-01', 'OIL.8': 'OIL_1989-09-01', 'GAS.7': 'GAS_1989-08-01', 'GAS.2': 'GAS_1989-03-01', 'GAS.1': 'GAS_1989-02-01', 'OIL.0': 'OIL_1989-01-01', 'GAS.5': 'GAS_1989-06-01', 'OIL.2': 'OIL_1989-03-01', 'OIL.5': 'OIL_1989-06-01', 'OIL.11': 'OIL_1989-12-01', 'GAS.0': 'GAS_1989-01-01', 'OIL.4': 'OIL_1989-05-01', 'GAS.4': 'GAS_1989-05-01', 'GAS.9': 'GAS_1989-10-01', 'GAS.6': 'GAS_1989-07-01', 'OIL.3': 'OIL_1989-04-01', 'OIL.7': 'OIL_1989-08-01', 'OIL.1': 'OIL_1989-02-01', 'GAS.10': 'GAS_1989-11-01', 'OIL.10': 'OIL_1989-11-01', 'OIL.9': 'OIL_1989-10-01'}
1990
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1990-04-01', 'GAS.11': 'GAS_1990-12-01', 'OIL.6': 'OIL_1990-07-01', 'GAS.8': 'GAS_1990-09-01', 'OIL.8': 'OIL_1990-09-01', 'GAS.7': 'GAS_1990-08-01', 'GAS.2': 'GAS_1990-03-01', 'GAS.1': 'GAS_1990-02-01', 'OIL.0': 'OIL_1990-01-01', 'GAS.5': 'GAS_1990-06-01', 'OIL.2': 'OIL_1990-03-01', 'OIL.5': 'OIL_1990-06-01', 'OIL.11': 'OIL_1990-12-01', 'GAS.0': 'GAS_1990-01-01', 'OIL.4': 'OIL_1990-05-01', 'GAS.4': 'GAS_1990-05-01', 'GAS.9': 'GAS_1990-10-01', 'GAS.6': 'GAS_1990-07-01', 'OIL.3': 'OIL_1990-04-01', 'OIL.7': 'OIL_1990-08-01', 'OIL.1': 'OIL_1990-02-01', 'GAS.10': 'GAS_1990-11-01', 'OIL.10': 'OIL_1990-11-01', 'OIL.9': 'OIL_1990-10-01'}
1991
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1991-04-01', 'GAS.11': 'GAS_1991-12-01', 'OIL.6': 'OIL_1991-07-01', 'GAS.8': 'GAS_1991-09-01', 'OIL.8': 'OIL_1991-09-01', 'GAS.7': 'GAS_1991-08-01', 'GAS.2': 'GAS_1991-03-01', 'GAS.1': 'GAS_1991-02-01', 'OIL.0': 'OIL_1991-01-01', 'GAS.5': 'GAS_1991-06-01', 'OIL.2': 'OIL_1991-03-01', 'OIL.5': 'OIL_1991-06-01', 'OIL.11': 'OIL_1991-12-01', 'GAS.0': 'GAS_1991-01-01', 'OIL.4': 'OIL_1991-05-01', 'GAS.4': 'GAS_1991-05-01', 'GAS.9': 'GAS_1991-10-01', 'GAS.6': 'GAS_1991-07-01', 'OIL.3': 'OIL_1991-04-01', 'OIL.7': 'OIL_1991-08-01', 'OIL.1': 'OIL_1991-02-01', 'GAS.10': 'GAS_1991-11-01', 'OIL.10': 'OIL_1991-11-01', 'OIL.9': 'OIL_1991-10-01'}
1992
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1992-04-01', 'GAS.11': 'GAS_1992-12-01', 'OIL.6': 'OIL_1992-07-01', 'GAS.8': 'GAS_1992-09-01', 'OIL.8': 'OIL_1992-09-01', 'GAS.7': 'GAS_1992-08-01', 'GAS.2': 'GAS_1992-03-01', 'GAS.1': 'GAS_1992-02-01', 'OIL.0': 'OIL_1992-01-01', 'GAS.5': 'GAS_1992-06-01', 'OIL.2': 'OIL_1992-03-01', 'OIL.5': 'OIL_1992-06-01', 'OIL.11': 'OIL_1992-12-01', 'GAS.0': 'GAS_1992-01-01', 'OIL.4': 'OIL_1992-05-01', 'GAS.4': 'GAS_1992-05-01', 'GAS.9': 'GAS_1992-10-01', 'GAS.6': 'GAS_1992-07-01', 'OIL.3': 'OIL_1992-04-01', 'OIL.7': 'OIL_1992-08-01', 'OIL.1': 'OIL_1992-02-01', 'GAS.10': 'GAS_1992-11-01', 'OIL.10': 'OIL_1992-11-01', 'OIL.9': 'OIL_1992-10-01'}
1993
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1993-04-01', 'GAS.11': 'GAS_1993-12-01', 'OIL.6': 'OIL_1993-07-01', 'GAS.8': 'GAS_1993-09-01', 'OIL.8': 'OIL_1993-09-01', 'GAS.7': 'GAS_1993-08-01', 'GAS.2': 'GAS_1993-03-01', 'GAS.1': 'GAS_1993-02-01', 'OIL.0': 'OIL_1993-01-01', 'GAS.5': 'GAS_1993-06-01', 'OIL.2': 'OIL_1993-03-01', 'OIL.5': 'OIL_1993-06-01', 'OIL.11': 'OIL_1993-12-01', 'GAS.0': 'GAS_1993-01-01', 'OIL.4': 'OIL_1993-05-01', 'GAS.4': 'GAS_1993-05-01', 'GAS.9': 'GAS_1993-10-01', 'GAS.6': 'GAS_1993-07-01', 'OIL.3': 'OIL_1993-04-01', 'OIL.7': 'OIL_1993-08-01', 'OIL.1': 'OIL_1993-02-01', 'GAS.10': 'GAS_1993-11-01', 'OIL.10': 'OIL_1993-11-01', 'OIL.9': 'OIL_1993-10-01'}
1995
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1995-04-01', 'GAS.11': 'GAS_1995-12-01', 'OIL.6': 'OIL_1995-07-01', 'GAS.8': 'GAS_1995-09-01', 'OIL.8': 'OIL_1995-09-01', 'GAS.7': 'GAS_1995-08-01', 'GAS.2': 'GAS_1995-03-01', 'GAS.1': 'GAS_1995-02-01', 'OIL.0': 'OIL_1995-01-01', 'GAS.5': 'GAS_1995-06-01', 'OIL.2': 'OIL_1995-03-01', 'OIL.5': 'OIL_1995-06-01', 'OIL.11': 'OIL_1995-12-01', 'GAS.0': 'GAS_1995-01-01', 'OIL.4': 'OIL_1995-05-01', 'GAS.4': 'GAS_1995-05-01', 'GAS.9': 'GAS_1995-10-01', 'GAS.6': 'GAS_1995-07-01', 'OIL.3': 'OIL_1995-04-01', 'OIL.7': 'OIL_1995-08-01', 'OIL.1': 'OIL_1995-02-01', 'GAS.10': 'GAS_1995-11-01', 'OIL.10': 'OIL_1995-11-01', 'OIL.9': 'OIL_1995-10-01'}
1996
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1996-04-01', 'GAS.11': 'GAS_1996-12-01', 'OIL.6': 'OIL_1996-07-01', 'GAS.8': 'GAS_1996-09-01', 'OIL.8': 'OIL_1996-09-01', 'GAS.7': 'GAS_1996-08-01', 'GAS.2': 'GAS_1996-03-01', 'GAS.1': 'GAS_1996-02-01', 'OIL.0': 'OIL_1996-01-01', 'GAS.5': 'GAS_1996-06-01', 'OIL.2': 'OIL_1996-03-01', 'OIL.5': 'OIL_1996-06-01', 'OIL.11': 'OIL_1996-12-01', 'GAS.0': 'GAS_1996-01-01', 'OIL.4': 'OIL_1996-05-01', 'GAS.4': 'GAS_1996-05-01', 'GAS.9': 'GAS_1996-10-01', 'GAS.6': 'GAS_1996-07-01', 'OIL.3': 'OIL_1996-04-01', 'OIL.7': 'OIL_1996-08-01', 'OIL.1': 'OIL_1996-02-01', 'GAS.10': 'GAS_1996-11-01', 'OIL.10': 'OIL_1996-11-01', 'OIL.9': 'OIL_1996-10-01'}
1997
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1997-04-01', 'GAS.11': 'GAS_1997-12-01', 'OIL.6': 'OIL_1997-07-01', 'GAS.8': 'GAS_1997-09-01', 'OIL.8': 'OIL_1997-09-01', 'GAS.7': 'GAS_1997-08-01', 'GAS.2': 'GAS_1997-03-01', 'GAS.1': 'GAS_1997-02-01', 'OIL.0': 'OIL_1997-01-01', 'GAS.5': 'GAS_1997-06-01', 'OIL.2': 'OIL_1997-03-01', 'OIL.5': 'OIL_1997-06-01', 'OIL.11': 'OIL_1997-12-01', 'GAS.0': 'GAS_1997-01-01', 'OIL.4': 'OIL_1997-05-01', 'GAS.4': 'GAS_1997-05-01', 'GAS.9': 'GAS_1997-10-01', 'GAS.6': 'GAS_1997-07-01', 'OIL.3': 'OIL_1997-04-01', 'OIL.7': 'OIL_1997-08-01', 'OIL.1': 'OIL_1997-02-01', 'GAS.10': 'GAS_1997-11-01', 'OIL.10': 'OIL_1997-11-01', 'OIL.9': 'OIL_1997-10-01'}
1998
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1998-04-01', 'GAS.11': 'GAS_1998-12-01', 'OIL.6': 'OIL_1998-07-01', 'GAS.8': 'GAS_1998-09-01', 'OIL.8': 'OIL_1998-09-01', 'GAS.7': 'GAS_1998-08-01', 'GAS.2': 'GAS_1998-03-01', 'GAS.1': 'GAS_1998-02-01', 'OIL.0': 'OIL_1998-01-01', 'GAS.5': 'GAS_1998-06-01', 'OIL.2': 'OIL_1998-03-01', 'OIL.5': 'OIL_1998-06-01', 'OIL.11': 'OIL_1998-12-01', 'GAS.0': 'GAS_1998-01-01', 'OIL.4': 'OIL_1998-05-01', 'GAS.4': 'GAS_1998-05-01', 'GAS.9': 'GAS_1998-10-01', 'GAS.6': 'GAS_1998-07-01', 'OIL.3': 'OIL_1998-04-01', 'OIL.7': 'OIL_1998-08-01', 'OIL.1': 'OIL_1998-02-01', 'GAS.10': 'GAS_1998-11-01', 'OIL.10': 'OIL_1998-11-01', 'OIL.9': 'OIL_1998-10-01'}
1999
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_1999-04-01', 'GAS.11': 'GAS_1999-12-01', 'OIL.6': 'OIL_1999-07-01', 'GAS.8': 'GAS_1999-09-01', 'OIL.8': 'OIL_1999-09-01', 'GAS.7': 'GAS_1999-08-01', 'GAS.2': 'GAS_1999-03-01', 'GAS.1': 'GAS_1999-02-01', 'OIL.0': 'OIL_1999-01-01', 'GAS.5': 'GAS_1999-06-01', 'OIL.2': 'OIL_1999-03-01', 'OIL.5': 'OIL_1999-06-01', 'OIL.11': 'OIL_1999-12-01', 'GAS.0': 'GAS_1999-01-01', 'OIL.4': 'OIL_1999-05-01', 'GAS.4': 'GAS_1999-05-01', 'GAS.9': 'GAS_1999-10-01', 'GAS.6': 'GAS_1999-07-01', 'OIL.3': 'OIL_1999-04-01', 'OIL.7': 'OIL_1999-08-01', 'OIL.1': 'OIL_1999-02-01', 'GAS.10': 'GAS_1999-11-01', 'OIL.10': 'OIL_1999-11-01', 'OIL.9': 'OIL_1999-10-01'}
2000
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_2000-04-01', 'GAS.11': 'GAS_2000-12-01', 'OIL.6': 'OIL_2000-07-01', 'GAS.8': 'GAS_2000-09-01', 'OIL.8': 'OIL_2000-09-01', 'GAS.7': 'GAS_2000-08-01', 'GAS.2': 'GAS_2000-03-01', 'GAS.1': 'GAS_2000-02-01', 'OIL.0': 'OIL_2000-01-01', 'GAS.5': 'GAS_2000-06-01', 'OIL.2': 'OIL_2000-03-01', 'OIL.5': 'OIL_2000-06-01', 'OIL.11': 'OIL_2000-12-01', 'GAS.0': 'GAS_2000-01-01', 'OIL.4': 'OIL_2000-05-01', 'GAS.4': 'GAS_2000-05-01', 'GAS.9': 'GAS_2000-10-01', 'GAS.6': 'GAS_2000-07-01', 'OIL.3': 'OIL_2000-04-01', 'OIL.7': 'OIL_2000-08-01', 'OIL.1': 'OIL_2000-02-01', 'GAS.10': 'GAS_2000-11-01', 'OIL.10': 'OIL_2000-11-01', 'OIL.9': 'OIL_2000-10-01'}
2001
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_2001-04-01', 'GAS.11': 'GAS_2001-12-01', 'OIL.6': 'OIL_2001-07-01', 'GAS.8': 'GAS_2001-09-01', 'OIL.8': 'OIL_2001-09-01', 'GAS.7': 'GAS_2001-08-01', 'GAS.2': 'GAS_2001-03-01', 'GAS.1': 'GAS_2001-02-01', 'OIL.0': 'OIL_2001-01-01', 'GAS.5': 'GAS_2001-06-01', 'OIL.2': 'OIL_2001-03-01', 'OIL.5': 'OIL_2001-06-01', 'OIL.11': 'OIL_2001-12-01', 'GAS.0': 'GAS_2001-01-01', 'OIL.4': 'OIL_2001-05-01', 'GAS.4': 'GAS_2001-05-01', 'GAS.9': 'GAS_2001-10-01', 'GAS.6': 'GAS_2001-07-01', 'OIL.3': 'OIL_2001-04-01', 'OIL.7': 'OIL_2001-08-01', 'OIL.1': 'OIL_2001-02-01', 'GAS.10': 'GAS_2001-11-01', 'OIL.10': 'OIL_2001-11-01', 'OIL.9': 'OIL_2001-10-01'}
2002
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_2002-04-01', 'GAS.11': 'GAS_2002-12-01', 'OIL.6': 'OIL_2002-07-01', 'GAS.8': 'GAS_2002-09-01', 'OIL.8': 'OIL_2002-09-01', 'GAS.7': 'GAS_2002-08-01', 'GAS.2': 'GAS_2002-03-01', 'GAS.1': 'GAS_2002-02-01', 'OIL.0': 'OIL_2002-01-01', 'GAS.5': 'GAS_2002-06-01', 'OIL.2': 'OIL_2002-03-01', 'OIL.5': 'OIL_2002-06-01', 'OIL.11': 'OIL_2002-12-01', 'GAS.0': 'GAS_2002-01-01', 'OIL.4': 'OIL_2002-05-01', 'GAS.4': 'GAS_2002-05-01', 'GAS.9': 'GAS_2002-10-01', 'GAS.6': 'GAS_2002-07-01', 'OIL.3': 'OIL_2002-04-01', 'OIL.7': 'OIL_2002-08-01', 'OIL.1': 'OIL_2002-02-01', 'GAS.10': 'GAS_2002-11-01', 'OIL.10': 'OIL_2002-11-01', 'OIL.9': 'OIL_2002-10-01'}
2003
Index(['API_COUNTY', 'API_NUMBER', 'SUFFIX', 'WELL_NAME', 'WELL_NO',
       '  OPER_NO', 'OPER_SUFFIX', 'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN',
       'Q4', 'Q3', 'Q2', 'Q1', 'LATITUDE', 'LONGITUDE', 'OTC_COUNTY',
       'OTC_LEASE_NO', 'OTC_SUB_NO', 'OTC_MERGE', 'POOL_NO', 'CODE',
       'FORMATION', 'OFB', 'ALLOWABLE_CLASS', 'ALLOWABLE_TYPE', ' PURCH_NO',
       'PURCHASER', 'PURCH_SUFFIX', 'OFB.1', 'YEAR', 'JAN', 'OIL.0', 'GAS.0',
       'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2', 'APR', 'OIL.3',
       'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5', 'GAS.5', 'JUL',
       'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP', 'OIL.8', 'GAS.8',
       'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10', 'DEC', 'OIL.11',
       'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_2003-04-01', 'GAS.11': 'GAS_2003-12-01', 'OIL.6': 'OIL_2003-07-01', 'GAS.8': 'GAS_2003-09-01', 'OIL.8': 'OIL_2003-09-01', 'GAS.7': 'GAS_2003-08-01', 'GAS.2': 'GAS_2003-03-01', 'GAS.1': 'GAS_2003-02-01', 'OIL.0': 'OIL_2003-01-01', 'GAS.5': 'GAS_2003-06-01', 'OIL.2': 'OIL_2003-03-01', 'OIL.5': 'OIL_2003-06-01', 'OIL.11': 'OIL_2003-12-01', 'GAS.0': 'GAS_2003-01-01', 'OIL.4': 'OIL_2003-05-01', 'GAS.4': 'GAS_2003-05-01', 'GAS.9': 'GAS_2003-10-01', 'GAS.6': 'GAS_2003-07-01', 'OIL.3': 'OIL_2003-04-01', 'OIL.7': 'OIL_2003-08-01', 'OIL.1': 'OIL_2003-02-01', 'GAS.10': 'GAS_2003-11-01', 'OIL.10': 'OIL_2003-11-01', 'OIL.9': 'OIL_2003-10-01'}
2004
E:\Anaconda3\lib\site-packages\IPython\core\interactiveshell.py:2717: DtypeWarning: Columns (0,1,5,8,15,16,17,18,19,20,27,29,30,33,36,39) have mixed types. Specify dtype option on import or set low_memory=False.
  interactivity=interactivity, compiler=compiler, result=result)
Index(['API_COUNTY', 'API_NUMBER', 'S', 'WELL_NAME', 'WELL_NO', '  OPER_NO',
       'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN', 'Q4', 'Q3', 'Q2', 'Q1',
       'LATITUDE', 'LONGITUDE', 'OTC_COUNTY', 'OTC_LEASE_NO', 'OTC_SUB_NO',
       'OTC_MERGE', 'POOL_NO', 'CODE', 'FORMATION', 'ALLOWABLE_CLASS',
       'ALLOWABLE_TYPE', ' PURCH_NO', 'PURCHASER', 'OFB.1', 'YEAR', 'JAN',
       'OIL.0', 'GAS.0', 'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2',
       'APR', 'OIL.3', 'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5',
       'GAS.5', 'JUL', 'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP',
       'OIL.8', 'GAS.8', 'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10',
       'DEC', 'OIL.11', 'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_2004-04-01', 'GAS.11': 'GAS_2004-12-01', 'OIL.6': 'OIL_2004-07-01', 'GAS.8': 'GAS_2004-09-01', 'OIL.8': 'OIL_2004-09-01', 'GAS.7': 'GAS_2004-08-01', 'GAS.2': 'GAS_2004-03-01', 'GAS.1': 'GAS_2004-02-01', 'OIL.0': 'OIL_2004-01-01', 'GAS.5': 'GAS_2004-06-01', 'OIL.2': 'OIL_2004-03-01', 'OIL.5': 'OIL_2004-06-01', 'OIL.11': 'OIL_2004-12-01', 'GAS.0': 'GAS_2004-01-01', 'OIL.4': 'OIL_2004-05-01', 'GAS.4': 'GAS_2004-05-01', 'GAS.9': 'GAS_2004-10-01', 'GAS.6': 'GAS_2004-07-01', 'OIL.3': 'OIL_2004-04-01', 'OIL.7': 'OIL_2004-08-01', 'OIL.1': 'OIL_2004-02-01', 'GAS.10': 'GAS_2004-11-01', 'OIL.10': 'OIL_2004-11-01', 'OIL.9': 'OIL_2004-10-01'}
2005
E:\Anaconda3\lib\site-packages\IPython\core\interactiveshell.py:2717: DtypeWarning: Columns (0,1,5,8,15,16,17,18,19,20,27,29,30) have mixed types. Specify dtype option on import or set low_memory=False.
  interactivity=interactivity, compiler=compiler, result=result)
Index(['API_COUNTY', 'API_NUMBER', 'S', 'WELL_NAME', 'WELL_NO', '  OPER_NO',
       'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN', 'Q4', 'Q3', 'Q2', 'Q1',
       'LATITUDE', 'LONGITUDE', 'OTC_COUNTY', 'OTC_LEASE_NO', 'OTC_SUB_NO',
       'OTC_MERGE', 'POOL_NO', 'CODE', 'FORMATION', 'ALLOWABLE_CLASS',
       'ALLOWABLE_TYPE', ' PURCH_NO', 'PURCHASER', 'OFB.1', 'YEAR', 'JAN',
       'OIL.0', 'GAS.0', 'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2',
       'APR', 'OIL.3', 'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5',
       'GAS.5', 'JUL', 'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP',
       'OIL.8', 'GAS.8', 'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10',
       'DEC', 'OIL.11', 'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_2005-04-01', 'GAS.11': 'GAS_2005-12-01', 'OIL.6': 'OIL_2005-07-01', 'GAS.8': 'GAS_2005-09-01', 'OIL.8': 'OIL_2005-09-01', 'GAS.7': 'GAS_2005-08-01', 'GAS.2': 'GAS_2005-03-01', 'GAS.1': 'GAS_2005-02-01', 'OIL.0': 'OIL_2005-01-01', 'GAS.5': 'GAS_2005-06-01', 'OIL.2': 'OIL_2005-03-01', 'OIL.5': 'OIL_2005-06-01', 'OIL.11': 'OIL_2005-12-01', 'GAS.0': 'GAS_2005-01-01', 'OIL.4': 'OIL_2005-05-01', 'GAS.4': 'GAS_2005-05-01', 'GAS.9': 'GAS_2005-10-01', 'GAS.6': 'GAS_2005-07-01', 'OIL.3': 'OIL_2005-04-01', 'OIL.7': 'OIL_2005-08-01', 'OIL.1': 'OIL_2005-02-01', 'GAS.10': 'GAS_2005-11-01', 'OIL.10': 'OIL_2005-11-01', 'OIL.9': 'OIL_2005-10-01'}
2006
Index(['API_COUNTY', 'API_NUMBER', 'S', 'WELL_NAME', 'WELL_NO', '  OPER_NO',
       'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN', 'Q4', 'Q3', 'Q2', 'Q1',
       'LATITUDE', 'LONGITUDE', 'OTC_COUNTY', 'OTC_LEASE_NO', 'OTC_SUB_NO',
       'OTC_MERGE', 'POOL_NO', 'CODE', 'FORMATION', 'ALLOWABLE_CLASS',
       'ALLOWABLE_TYPE', ' PURCH_NO', 'PURCHASER', 'OFB.1', 'YEAR', 'JAN',
       'OIL.0', 'GAS.0', 'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2',
       'APR', 'OIL.3', 'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5',
       'GAS.5', 'JUL', 'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP',
       'OIL.8', 'GAS.8', 'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10',
       'DEC', 'OIL.11', 'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_2006-04-01', 'GAS.11': 'GAS_2006-12-01', 'OIL.6': 'OIL_2006-07-01', 'GAS.8': 'GAS_2006-09-01', 'OIL.8': 'OIL_2006-09-01', 'GAS.7': 'GAS_2006-08-01', 'GAS.2': 'GAS_2006-03-01', 'GAS.1': 'GAS_2006-02-01', 'OIL.0': 'OIL_2006-01-01', 'GAS.5': 'GAS_2006-06-01', 'OIL.2': 'OIL_2006-03-01', 'OIL.5': 'OIL_2006-06-01', 'OIL.11': 'OIL_2006-12-01', 'GAS.0': 'GAS_2006-01-01', 'OIL.4': 'OIL_2006-05-01', 'GAS.4': 'GAS_2006-05-01', 'GAS.9': 'GAS_2006-10-01', 'GAS.6': 'GAS_2006-07-01', 'OIL.3': 'OIL_2006-04-01', 'OIL.7': 'OIL_2006-08-01', 'OIL.1': 'OIL_2006-02-01', 'GAS.10': 'GAS_2006-11-01', 'OIL.10': 'OIL_2006-11-01', 'OIL.9': 'OIL_2006-10-01'}
2007
E:\Anaconda3\lib\site-packages\IPython\core\interactiveshell.py:2717: DtypeWarning: Columns (0,1,5,8,15,16,17,18,19,20,27,29,30,33,36) have mixed types. Specify dtype option on import or set low_memory=False.
  interactivity=interactivity, compiler=compiler, result=result)
Index(['API_COUNTY', 'API_NUMBER', 'S', 'WELL_NAME', 'WELL_NO', '  OPER_NO',
       'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN', 'Q4', 'Q3', 'Q2', 'Q1',
       'LATITUDE', 'LONGITUDE', 'OTC_COUNTY', 'OTC_LEASE_NO', 'OTC_SUB_NO',
       'OTC_MERGE', 'POOL_NO', 'CODE', 'FORMATION', 'ALLOWABLE_CLASS',
       'ALLOWABLE_TYPE', ' PURCH_NO', 'PURCHASER', 'OFB.1', 'YEAR', 'JAN',
       'OIL.0', 'GAS.0', 'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2',
       'APR', 'OIL.3', 'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5',
       'GAS.5', 'JUL', 'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP',
       'OIL.8', 'GAS.8', 'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10',
       'DEC', 'OIL.11', 'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_2007-04-01', 'GAS.11': 'GAS_2007-12-01', 'OIL.6': 'OIL_2007-07-01', 'GAS.8': 'GAS_2007-09-01', 'OIL.8': 'OIL_2007-09-01', 'GAS.7': 'GAS_2007-08-01', 'GAS.2': 'GAS_2007-03-01', 'GAS.1': 'GAS_2007-02-01', 'OIL.0': 'OIL_2007-01-01', 'GAS.5': 'GAS_2007-06-01', 'OIL.2': 'OIL_2007-03-01', 'OIL.5': 'OIL_2007-06-01', 'OIL.11': 'OIL_2007-12-01', 'GAS.0': 'GAS_2007-01-01', 'OIL.4': 'OIL_2007-05-01', 'GAS.4': 'GAS_2007-05-01', 'GAS.9': 'GAS_2007-10-01', 'GAS.6': 'GAS_2007-07-01', 'OIL.3': 'OIL_2007-04-01', 'OIL.7': 'OIL_2007-08-01', 'OIL.1': 'OIL_2007-02-01', 'GAS.10': 'GAS_2007-11-01', 'OIL.10': 'OIL_2007-11-01', 'OIL.9': 'OIL_2007-10-01'}
2008
Index(['API_COUNTY', 'API_NUMBER', 'S', 'WELL_NAME', 'WELL_NO', '  OPER_NO',
       'OPERATOR', 'ME', 'SECTION', 'TWP', 'RAN', 'Q4', 'Q3', 'Q2', 'Q1',
       'LATITUDE', 'LONGITUDE', 'OTC_COUNTY', 'OTC_LEASE_NO', 'OTC_SUB_NO',
       'OTC_MERGE', 'POOL_NO', 'CODE', 'FORMATION', 'ALLOWABLE_CLASS',
       'ALLOWABLE_TYPE', ' PURCH_NO', 'PURCHASER', 'OFB.1', 'YEAR', 'JAN',
       'OIL.0', 'GAS.0', 'FEB', 'OIL.1', 'GAS.1', 'MAR', 'OIL.2', 'GAS.2',
       'APR', 'OIL.3', 'GAS.3', 'MAY', 'OIL.4', 'GAS.4', 'JUN', 'OIL.5',
       'GAS.5', 'JUL', 'OIL.6', 'GAS.6', 'AUG', 'OIL.7', 'GAS.7', 'SEP',
       'OIL.8', 'GAS.8', 'OCT', 'OIL.9', 'GAS.9', 'NOV', 'OIL.10', 'GAS.10',
       'DEC', 'OIL.11', 'GAS.11'],
      dtype='object')
{'GAS.3': 'GAS_2008-04-01', 'GAS.11': 'GAS_2008-12-01', 'OIL.6': 'OIL_2008-07-01', 'GAS.8': 'GAS_2008-09-01', 'OIL.8': 'OIL_2008-09-01', 'GAS.7': 'GAS_2008-08-01', 'GAS.2': 'GAS_2008-03-01', 'GAS.1': 'GAS_2008-02-01', 'OIL.0': 'OIL_2008-01-01', 'GAS.5': 'GAS_2008-06-01', 'OIL.2': 'OIL_2008-03-01', 'OIL.5': 'OIL_2008-06-01', 'OIL.11': 'OIL_2008-12-01', 'GAS.0': 'GAS_2008-01-01', 'OIL.4': 'OIL_2008-05-01', 'GAS.4': 'GAS_2008-05-01', 'GAS.9': 'GAS_2008-10-01', 'GAS.6': 'GAS_2008-07-01', 'OIL.3': 'OIL_2008-04-01', 'OIL.7': 'OIL_2008-08-01', 'OIL.1': 'OIL_2008-02-01', 'GAS.10': 'GAS_2008-11-01', 'OIL.10': 'OIL_2008-11-01', 'OIL.9': 'OIL_2008-10-01'}
2009
2010
2011
2012
2013
2014
2015
Out[2]:
API_COUNTY API_NUMBER S WELL_NAME WELL_NO OPER_NO OPERATOR ME SECTION TWP ... GAS.8 OCT OIL.9 GAS.9 NOV OIL.10 GAS.10 DEC OIL.11 GAS.11
0 3 1 NaN KIRCHER 1 4030 CHAMPLIN EXPLORATION INC INDIAN 4 27N ... NaN 10 NaN NaN 11 NaN NaN 12 NaN NaN
1 3 25 NaN HAGUE 1 19694 BVD INC Indian 22 27N ... 31.0 10 NaN 39.0 11 NaN 37.0 12 NaN 45.0
2 3 68 NaN ADAMS "A" 1-3 17441 CHESAPEAKE OPERATING LLC Indian 3 25N ... 0.0 10 NaN 0.0 11 NaN 0.0 12 NaN NaN
3 3 71 NaN NEWLIN 1 7775 COMBINED RESOURCES CORPORATION Indian 19 25N ... 1089.0 10 NaN 1089.0 11 NaN 873.0 12 NaN 512.0
4 3 73 NaN WOODWARD (VOSS) 1 11739 MACK ENERGY CO Indian 25 24N ... 608.0 10 NaN 468.0 11 NaN 344.0 12 NaN 857.0

5 rows × 66 columns


In [70]:
def filter_data(row):
    buffer = []
    for val in row:
        val_parsed = None
        try:
            val_parsed = int(val)
        except ValueError:
            val_parsed = 0
        buffer.append(val_parsed)
    return np.array(buffer, dtype=np.int32)

In [25]:
meta_dataframe = None
meta_prod_dfs = []
meta_data = {}
columns = ['API_NUMBER','API_COUNTY','LATITUDE', 'LONGITUDE', 'FORMATION']
for year in range(1987, 2016):
    print(year)
    if year != 1994:
        filter_col = columns
        yearly_meta_data = production_data[year]#.dropna()
        for i in range(1, len(yearly_meta_data.index)):
            row = yearly_meta_data.iloc[[i]]
            api_num = row["API_NUMBER"].values.astype(np.int32)[0]
            mdata = row[filter_col].values[0]
            if api_num in meta_data.keys():
                pass
            else:
                if not np.isnan(api_num):
                    meta_data[api_num] = {}
                    try:
                        meta_data[api_num]["API_COUNTY"] = int(mdata[1])
                        meta_data[api_num]["LATITUDE"] = float(mdata[2])
                        meta_data[api_num]["LONGITUDE"] = float(mdata[3])
                        form_str = str(mdata[4]).strip(" ")
                        meta_data[api_num]["FORMATION"] = form_str
                    except ValueError:
                        print("Found invalid value: ", api_num, year, mdata)


2011
Found invalid value:  -2147483648 2011 [nan nan nan nan nan]
2012
2013
2014
2015

In [29]:
del meta_data[-2147483648 ]

In [31]:
meta_out = {}
for key in meta_data.keys():
    meta_out[str(key)] = meta_data[key]

In [33]:
with open('../processed/immutable/immutable.json', 'w') as fp:
    json.dump(meta_out, fp, sort_keys=True)

In [ ]:


In [ ]: