In [1]:
import pandas as pd
import numpy as np
In [2]:
# Load the legislators table from the CSV that ships with the project.
legislatorsData = pd.read_csv("../data/legislators.csv")

# `legislators` is the name the rest of the notebook works with. read_csv
# already returns a DataFrame; the wrap is kept so `legislators` stays a
# separate DataFrame object from `legislatorsData`.
legislators = pd.DataFrame(legislatorsData)

# The cell's last expression is what the notebook renders: preview the rows.
legislators.head()
Out[2]:
In [3]:
# Show the column labels of the legislators table as a plain Python list.
legislators.columns.tolist()
Out[3]:
In [4]:
print legislators.bioguide_id.head()
l_bioGuides = legislators.bioguide_id.tolist()
l_bioGuides[:3]
print "Bio Guides available for the congress :", len(l_bioGuides)
In [5]:
from urllib2 import Request, urlopen
import json
from pandas.io.json import json_normalize
request=Request('http://capitolwords.org/api/1/phrases.json?entity_type=month&entity_value=201007&sort=count+desc&apikey=0bf8e7eb6ce146f48217bfee767c998d')
response = urlopen(request)
contents = response.read()
data = json.loads(contents)
print "Example object and query to the sunlight API:"
print data[:5]
In [6]:
first_table_ever = json_normalize(data)
print "After converting the content of the request in to a DataFrame\n Popular words of the month \n 100 only prionting a few:"
print "The shape is: ",first_table_ever.shape
first_table_ever.head(8)
Out[6]:
In [7]:
print "Yes they are unique"
len(first_table_ever.ngram.unique())
Out[7]:
In [8]:
print "One legislator fav words"
request=Request('http://capitolwords.org/api/1/phrases.json?entity_type=legislator&entity_value=L000551&apikey=0bf8e7eb6ce146f48217bfee767c998d')
response = urlopen(request)
contents = response.read()
data = json.loads(contents)
print data[:5]
len(data)
Out[8]:
In [9]:
legislator_example = json_normalize(data)
legislator_example.head()
list_of_words = legislator_example.ngram.tolist()
favorite_words ="|".join(list_of_words)
print "list of favorite words of a legislator:"
favorite_words
Out[9]:
In [10]:
# NOTE(review): plain assignment binds a second name to the SAME DataFrame
# object, so a column added through `legislators_option1` also shows up on
# `legislators`. If an independent frame is intended, `legislators.copy()`
# would be needed here -- confirm.
legislators_option1 = legislators
def requestWords(id):
    """Fetch the phrases of one legislator and return them as a single string.

    Queries the capitolwords.org "phrases" endpoint with
    ``entity_type=legislator`` and ``entity_value=str(id)``.

    Parameters
    ----------
    id : object
        Legislator identifier; it is converted with ``str`` before being
        placed in the URL (the notebook passes bioguide ids).

    Returns
    -------
    str or float
        The ``ngram`` values of the response joined with ``"|"``, or
        ``np.nan`` when the response body is at most two characters long
        (for example an empty JSON list ``[]``).
    """
    # NOTE(review): the API key is hardcoded; consider reading it from the
    # environment instead of committing it with the notebook.
    url = ("http://capitolwords.org/api/1/phrases.json?entity_type=legislator&entity_value="
           + str(id)
           + "&apikey=0bf8e7eb6ce146f48217bfee767c998d")

    response = urlopen(Request(url))
    try:
        contents = response.read()
    finally:
        # Always release the connection; this function is called once per row.
        response.close()

    # A body of two characters or fewer carries no phrases.
    if len(contents) <= 2:
        return np.nan

    words = json_normalize(json.loads(contents))
    return "|".join(words.ngram.tolist())
# Try the helper on a single id; the returned value is rendered by the notebook.
requestWords(id="A000369")
Out[10]:
In [11]:
# Look up the phrase string for every legislator and store it in a new column.
# requestWords converts its argument with str() itself, so the column needs no
# cast beforehand.
# NOTE: this issues one HTTP request per row, so the cell can take a while.
legislators_option1['favorite_words'] = legislators_option1['bioguide_id'].apply(requestWords)
In [12]:
# Preview the first 20 entries of the newly added column.
legislators_option1['favorite_words'].head(20)
Out[12]:
In [23]:
# Beneficiaries for events:
def requestBeneficiaries(id):
    """Fetch the events whose beneficiary matches ``id`` from politicalpartytime.org.

    Queries the ``/api/v1/event/`` endpoint with
    ``beneficiaries__crp_id=str(id)`` and ``format=json``.

    Parameters
    ----------
    id : object
        Identifier sent as ``beneficiaries__crp_id``; converted with ``str``.

    Returns
    -------
    pandas.DataFrame or float
        The decoded JSON passed through ``json_normalize``, or ``np.nan`` when
        the response body is at most two characters long.
        NOTE(review): the response schema is not visible from this notebook,
        so the frame is returned exactly as ``json_normalize`` builds it --
        confirm which columns are needed before post-processing.
    """
    # The URL needs an explicit scheme; without it the request cannot be opened.
    # NOTE(review): the API key is hardcoded; consider reading it from the
    # environment instead of committing it with the notebook.
    url = ("http://politicalpartytime.org/api/v1/event/?format=json&beneficiaries__crp_id="
           + str(id)
           + "&apikey=0bf8e7eb6ce146f48217bfee767c998d")

    response = urlopen(Request(url))
    try:
        # Read the body of THIS response rather than relying on a `contents`
        # variable left over from another cell.
        contents = response.read()
    finally:
        response.close()

    if len(contents) <= 2:
        return np.nan

    return json_normalize(json.loads(contents))
# Try the helper on a single id.
requestBeneficiaries(id="N00003675")
In [ ]: