In [3]:
import os

import pandas as pd
In [ ]:
def convert_json_to_csv(json_file_dir, csv_file_dir):
    """Convert every line-delimited ``.json`` file in a directory to CSV.

    Each file in ``json_file_dir`` whose name ends with ``.json`` is read
    with ``pd.read_json(..., lines=True)`` and written to ``csv_file_dir``
    under the same base name with a ``.csv`` extension, UTF-8 encoded and
    without the index column. Files with any other extension are ignored.

    Conversion is best-effort: if one file fails, its name is printed
    followed by ``error`` and processing continues with the next file.

    Args:
        json_file_dir: Directory containing the source ``.json`` files.
        csv_file_dir: Directory the ``.csv`` files are written to.
    """
    for filename in os.listdir(json_file_dir):
        if not filename.endswith('.json'):
            continue
        # Swap only the trailing extension; str.replace would also rewrite
        # any '.json' occurring earlier in the file name.
        csv_name = os.path.splitext(filename)[0] + '.csv'
        try:
            frame = pd.read_json(os.path.join(json_file_dir, filename), lines=True)
            frame.to_csv(os.path.join(csv_file_dir, csv_name), encoding='utf-8', index=False)
        except Exception:
            # Keep going on a bad file, but let KeyboardInterrupt/SystemExit
            # propagate instead of being swallowed by a bare except.
            print(filename + 'error\n')
# Convert the raw Yelp dataset JSON files into CSVs in the interim directory.
convert_json_to_csv(
    json_file_dir='/home/amlanlimaye/yelp-dataset-challenge/data/raw/',
    csv_file_dir='/home/amlanlimaye/yelp-dataset-challenge/data/interim/original_csv/',
)
In [5]:
# pd.read_json('../../data/raw/yelp_academic_dataset_business.json', lines=True).to_csv('../../data/interim/original_csv/business.csv', encoding='utf-8', index=False)
# pd.read_json('../../data/raw/yelp_academic_dataset_checkin.json', lines=True).to_csv('../../data/interim/original_csv/checkin.csv', encoding='utf-8', index=False)
# pd.read_json('../../data/raw/yelp_academic_dataset_review.json', lines=True).to_csv('../../data/interim/original_csv/review.csv', encoding='utf-8', index=False)
# pd.read_json('../../data/raw/yelp_academic_dataset_tip.json', lines=True).to_csv('../../data/interim/original_csv/tip.csv', encoding='utf-8', index=False)
# pd.read_json('../../data/raw/yelp_academic_dataset_user.json', lines=True).to_csv('../../data/interim/original_csv/user.csv', encoding='utf-8', index=False)