In [3]:
import json
# Read request.json in full and parse it into `values`.
# The context manager closes the file handle as soon as the text is read
# (the previous bare open() left it open for the life of the kernel), and a
# single read() replaces the line-by-line string concatenation.
with open('request.json', 'r') as jsonFile:
    full_json = jsonFile.read()
values = json.loads(full_json)
In [7]:
import random
import pandas as pd
In [8]:
# Label pools: every kept status gets one report type and one data source
# drawn at random, so those two columns are synthetic rather than derived
# from the status itself.
report_type_choices = ['ASSAULT', 'TEASING', 'GROPED', 'DRUGGED', 'RAPED']
data_source_choices = ['TF', 'AP']

# One accumulator list per output column.
username, latitude, longitude = [], [], []
report_type, content, data_source = [], [], []

for status in values['statuses']:
    geo = status['geo']
    # Only statuses that carry a geo entry are kept.
    if geo is None:
        continue
    coordinates = geo['coordinates']
    username.append(status['user']['screen_name'])
    report_type.append(random.choice(report_type_choices))
    # Element 0 is stored as latitude, element 1 as longitude.
    latitude.append(coordinates[0])
    longitude.append(coordinates[1])
    content.append(status['text'])
    data_source.append(random.choice(data_source_choices))

# Assemble the per-column lists into a single table, one row per kept status.
tweet_columns = {
    'username': username,
    'latitude': latitude,
    'longitude': longitude,
    'report_type': report_type,
    'report_content': content,
    'data_source': data_source,
}
tweet_list = pd.DataFrame(tweet_columns)
In [14]:
# Write the table to data.csv using '|' as the field delimiter; with pandas'
# default settings the DataFrame index is written as the first column.
tweet_list.to_csv(path_or_buf='data.csv', sep='|')
In [ ]: