In [198]:
import plotly.plotly as pl
import plotly.graph_objs as go
import plotly.offline as po
import matplotlib.pyplot as plt
import mpl_toolkits.basemap as bm
import pandas as pd
import numpy as np
import seaborn as sns

# Initialise plotly's offline mode so figures can render inside the notebook.
po.init_notebook_mode()
# NOTE(review): %pylab inline also star-imports numpy/matplotlib names into the
# interactive namespace (see the "Populating the interactive namespace" message
# it prints). The plotting cells visible here only use the explicit `plt`/`np`
# aliases -- confirm no other cell relies on the implicit names before
# replacing this with `%matplotlib inline`.
%pylab inline


Populating the interactive namespace from numpy and matplotlib

In [2]:
# Directory holding the pre-converted Yelp CSV exports (relative to the notebook).
PATH_TO_DATASETS = '../yelp_dataset/'

# Read the five tables with identical parser settings; the generator is
# unpacked in the same order as the file names listed below.
df_businesses, df_checkins, df_reviews, df_users, df_tips = (
    pd.read_csv(PATH_TO_DATASETS + csv_name, sep=',', encoding='utf-8')
    for csv_name in ('businesses.csv', 'checkins.csv', 'reviews.csv', 'users.csv', 'tips.csv')
)

In [3]:
# Peek at a single row to see the column layout of the businesses table.
df_businesses.head(1)


Out[3]:
business_id city full_address latitude longitude name open review_count stars state ... hour_saturday_open hour_sunday_close hour_sunday_open hour_thursday_close hour_thursday_open hour_tuesday_close hour_tuesday_open hour_wednesday_close hour_wednesday_open neighborhoods_count
0 vcNAWiLM4dR7D2nwwJ7nCA Phoenix 4840 E Indian School Rd\nSte 101\nPhoenix, AZ ... 33.499313 -111.983758 Eric Goldberg, MD True 9 3.5 AZ ... NaN NaN NaN 17:00 08:00 17:00 08:00 17:00 08:00 0

1 rows × 983 columns


In [4]:
# List every column name of the businesses table. print() with a single
# argument behaves the same on Python 2 and Python 3, whereas the bare
# print statement is a SyntaxError on Python 3.
print(df_businesses.columns.tolist())


[u'business_id', u'city', u'full_address', u'latitude', u'longitude', u'name', u'open', u'review_count', u'stars', u'state', u'category_accessories', u'category_accountants', u'category_active_life', u'category_acupuncture', u'category_adult', u'category_adult_education', u'category_adult_entertainment', u'category_advertising', u'category_afghan', u'category_african', u'category_airlines', u'category_airport_lounges', u'category_airport_shuttles', u'category_airports', u'category_allergists', u'category_amateur_sports_teams', u'category_american_(new)', u'category_american_(traditional)', u'category_amusement_parks', u'category_anesthesiologists', u'category_animal_shelters', u'category_antiques', u'category_apartments', u'category_appliances', u'category_appliances_&_repair', u'category_aquarium_services', u'category_aquariums', u'category_arabian', u'category_arcades', u'category_archery', u'category_architects', u'category_argentine', u'category_art_classes', u'category_art_galleries', u'category_art_schools', u'category_art_supplies', u'category_arts_&_crafts', u'category_arts_&_entertainment', u'category_asian_fusion', u'category_auction_houses', u'category_audiologist', u'category_australian', u'category_austrian', u'category_auto_customization', u'category_auto_detailing', u'category_auto_glass_services', u'category_auto_loan_providers', u'category_auto_parts_&_supplies', u'category_auto_repair', u'category_automotive', u'category_baby_gear_&_furniture', u'category_baden', u'category_bagels', u'category_bail_bondsmen', u'category_bakeries', u'category_bangladeshi', u'category_bankruptcy_law', u'category_banks_&_credit_unions', u'category_barbeque', u'category_barbers', u'category_barre_classes', u'category_bars', u'category_bartenders', u'category_bartending_schools', u'category_basketball_courts', u'category_basque', u'category_battery_stores', u'category_batting_cages', u'category_bavarian', u'category_beaches', u'category_beauty_&_spas', 
u'category_bed_&_breakfast', u'category_beer_bar', u'category_beer_garden', u'category_beer_gardens', u'category_beer,_wine_&_spirits', u'category_belgian', u'category_bespoke_clothing', u'category_beverage_store', u'category_bike_rentals', u'category_bike_repair/maintenance', u'category_bike_sharing', u'category_bikes', u'category_bistros', u'category_blow_dry/out_services', u'category_boat_charters', u'category_boat_dealers', u'category_boat_repair', u'category_boating', u'category_body_shops', u'category_books,_mags,_music_&_video', u'category_bookstores', u'category_boot_camps', u'category_botanical_gardens', u'category_bowling', u'category_boxing', u'category_brasseries', u'category_brazilian', u'category_breakfast_&_brunch', u'category_breweries', u'category_brewing_supplies', u'category_bridal', u'category_british', u'category_bubble_tea', u'category_buddhist_temples', u'category_buffets', u'category_building_supplies', u'category_burgers', u'category_burmese', u'category_bus_tours', u'category_buses', u'category_business_law', u'category_butcher', u'category_cpr_classes', u'category_csa', u'category_cabaret', u'category_cabinetry', u'category_cafes', u'category_cafeteria', u'category_cajun/creole', u'category_cambodian', u'category_campgrounds', u'category_canadian_(new)', u'category_candy_stores', u'category_cannabis_clinics', u'category_cantonese', u'category_car_dealers', u'category_car_rental', u'category_car_share_services', u'category_car_stereo_installation', u'category_car_wash', u'category_cardiologists', u'category_cards_&_stationery', u'category_career_counseling', u'category_caribbean', u'category_carpet_cleaning', u'category_carpet_installation', u'category_carpeting', u'category_casinos', u'category_castles', u'category_caterers', u'category_challenge_courses', u'category_champagne_bars', u'category_check_cashing/pay_day_loans', u'category_cheese_shops', u'category_cheesesteaks', u'category_chicken_wings', u'category_child_care_&_day_care', 
u"category_children's_clothing", u'category_chimney_sweeps', u'category_chinese', u'category_chiropractors', u'category_chocolatiers_&_shops', u'category_christmas_markets', u'category_churches', u'category_cinema', u'category_climbing', u'category_clowns', u'category_cocktail_bars', u'category_coffee_&_tea', u'category_coffee_&_tea_supplies', u'category_coffeeshops', u'category_college_counseling', u'category_colleges_&_universities', u'category_colombian', u'category_comedy_clubs', u'category_comfort_food', u'category_comic_books', u'category_commercial_real_estate', u'category_community_service/non_profit', u'category_computers', u'category_contractors', u'category_convenience_stores', u'category_cooking_classes', u'category_cooking_schools', u'category_cosmetic_dentists', u'category_cosmetic_surgeons', u'category_cosmetics_&_beauty_supply', u'category_cosmetology_schools', u'category_costumes', u'category_counseling_&_mental_health', u'category_country_dance_halls', u'category_couriers_&_delivery_services', u'category_courthouses', u'category_creperies', u'category_criminal_defense_law', u'category_cuban', u'category_cultural_center', u'category_cupcakes', u'category_currency_exchange', u'category_curry_sausage', u'category_customized_merchandise', u'category_cycling_classes', u'category_czech', u'category_djs', u'category_dui_law', u'category_damage_restoration', u'category_dance_clubs', u'category_dance_schools', u'category_dance_studios', u'category_data_recovery', u'category_day_camps', u'category_day_spas', u'category_delicatessen', u'category_delis', u'category_dentists', u'category_department_stores', u'category_departments_of_motor_vehicles', u'category_dermatologists', u'category_desserts', u'category_diagnostic_imaging', u'category_diagnostic_services', u'category_dim_sum', u'category_diners', u'category_disc_golf', u'category_discount_store', u'category_distilleries', u'category_dive_bars', u'category_diving', u'category_divorce_&_family_law', 
u'category_do_it_yourself_food', u'category_doctors', u'category_dog_parks', u'category_dog_walkers', u'category_dominican', u'category_donairs', u'category_donuts', u'category_door_sales/installation', u'category_doulas', u'category_driving_schools', u'category_drugstores', u'category_dry_cleaning_&_laundry', u'category_drywall_installation_&_repair', u'category_ear_nose_&_throat', u'category_eastern_european', u'category_eastern_german', u'category_education', u'category_educational_services', u'category_egyptian', u'category_electricians', u'category_electronics', u'category_electronics_repair', u'category_elementary_schools', u'category_embroidery_&_crochet', u'category_employment_agencies', u'category_employment_law', u'category_endocrinologists', u'category_endodontists', u'category_estate_planning_law', u'category_ethiopian', u'category_ethnic_food', u'category_ethnic_grocery', u'category_event_photography', u'category_event_planning_&_services', u'category_eyelash_service', u'category_eyewear_&_opticians', u'category_fabric_stores', u'category_face_painting', u'category_falafel', u'category_family_practice', u'category_farmers_market', u'category_fashion', u'category_fast_food', u'category_fences_&_gates', u'category_fertility', u'category_festivals', u'category_filipino', u'category_financial_advising', u'category_financial_services', u'category_fire_protection_services', u'category_firearm_training', u'category_fireplace_services', u'category_firewood', u'category_fireworks', u'category_first_aid_classes', u'category_fish_&_chips', u'category_fishing', u'category_fitness_&_instruction', u'category_flea_markets', u'category_flight_instruction', u'category_flooring', u'category_florists', u'category_flowers', u'category_flowers_&_gifts', u'category_fondue', u'category_food', u'category_food_banks', u'category_food_court', u'category_food_delivery_services', u'category_food_stands', u'category_food_tours', u'category_food_trucks', u'category_formal_wear', 
u'category_framing', u'category_french', u'category_fruits_&_veggies', u'category_funeral_services_&_cemeteries', u'category_furniture_repair', u'category_furniture_reupholstery', u'category_furniture_stores', u'category_garage_door_services', u'category_gardeners', u'category_gas_&_service_stations', u'category_gastroenterologist', u'category_gastropubs', u'category_gay_bars', u'category_gelato', u'category_general_dentistry', u'category_general_festivals', u'category_general_litigation', u'category_german', u'category_gift_shops', u'category_glass_&_mirrors', u'category_gluten_free', u'category_go_karts', u'category_gold_buyers', u'category_golf', u'category_golf_equipment', u'category_golf_equipment_shops', u'category_graphic_design', u'category_greek', u'category_grocery', u'category_guest_houses', u'category_gun/rifle_ranges', u'category_guns_&_ammo', u'category_gutter_services', u'category_gymnastics', u'category_gyms', u'category_hair_extensions', u'category_hair_removal', u'category_hair_salons', u'category_hair_stylists', u'category_haitian', u'category_halal', u'category_handyman', u'category_hang_gliding', u'category_hardware_stores', u'category_hats', u'category_hawaiian', u'category_health_&_medical', u'category_health_markets', u'category_health_retreats', u'category_hearing_aid_providers', u'category_heating_&_air_conditioning/hvac', u'category_herbs_&_spices', u'category_high_fidelity_audio_equipment', u'category_hiking', u'category_himalayan/nepalese', u'category_hindu_temples', u'category_hobby_shops', u'category_home_&_garden', u'category_home_cleaning', u'category_home_decor', u'category_home_health_care', u'category_home_inspectors', u'category_home_organization', u'category_home_services', u'category_home_staging', u'category_home_theatre_installation', u'category_home_window_tinting', u'category_hookah_bars', u'category_horse_boarding', u'category_horse_racing', u'category_horseback_riding', u'category_hospice', u'category_hospitals', 
u'category_hostels', u'category_hot_air_balloons', u'category_hot_dogs', u'category_hot_pot', u'category_hot_tub_&_pool', u'category_hotels', u'category_hotels_&_travel', u'category_hungarian', u'category_hypnosis/hypnotherapy', u'category_it_services_&_computer_repair', u'category_iberian', u'category_ice_cream_&_frozen_yogurt', u'category_immigration_law', u'category_indian', u'category_indonesian', u'category_insulation_installation', u'category_insurance', u'category_interior_design', u'category_internal_medicine', u'category_international', u'category_internet_cafes', u'category_internet_service_providers', u'category_investing', u'category_irish', u'category_irish_pub', u'category_irrigation', u'category_italian', u'category_izakaya', u'category_japanese', u'category_jazz_&_blues', u'category_jewelry', u'category_jewelry_repair', u'category_juice_bars_&_smoothies', u'category_junk_removal_&_hauling', u'category_karaoke', u'category_kebab', u'category_keys_&_locksmiths', u'category_kids_activities', u'category_kitchen_&_bath', u'category_knitting_supplies', u'category_korean', u'category_kosher', u'category_laboratory_testing', u'category_lactation_services', u'category_lakes', u'category_landmarks_&_historical_buildings', u'category_landscape_architects', u'category_landscaping', u'category_language_schools', u'category_laotian', u'category_laser_eye_surgery/lasik', u'category_laser_hair_removal', u'category_laser_tag', u'category_latin_american', u'category_lawyers', u'category_leather_goods', u'category_lebanese', u'category_legal_services', u'category_leisure_centers', u'category_libraries', u'category_lice_services', u'category_life_coach', u'category_lighting_fixtures_&_equipment', u'category_limos', u'category_lingerie', u'category_live/raw_food', u'category_local_flavor', u'category_local_services', u'category_lounges', u'category_luggage', u'category_magicians', u'category_mailbox_centers', u'category_makeup_artists', u'category_malaysian', 
u'category_marketing', u'category_martial_arts', u'category_masonry/concrete', u'category_mass_media', u'category_massage', u'category_massage_schools', u'category_massage_therapy', u'category_matchmakers', u'category_maternity_wear', u'category_mattresses', u'category_meat_shops', u'category_medical_centers', u'category_medical_spas', u'category_medical_supplies', u'category_medical_transportation', u'category_meditation_centers', u'category_mediterranean', u"category_men's_clothing", u"category_men's_hair_salons", u'category_metal_fabricators', u'category_mexican', u'category_middle_eastern', u'category_middle_schools_&_high_schools', u'category_midwives', u'category_mini_golf', u'category_mobile_phone_repair', u'category_mobile_phones', u'category_modern_european', u'category_mongolian', u'category_moroccan', u'category_mortgage_brokers', u'category_mosques', u'category_motorcycle_dealers', u'category_motorcycle_gear', u'category_motorcycle_rental', u'category_motorcycle_repair', u'category_mountain_biking', u'category_movers', u'category_museums', u'category_music_&_dvds', u'category_music_venues', u'category_musical_instrument_services', u'category_musical_instruments_&_teachers', u'category_musicians', u'category_nail_salons', u'category_nanny_services', u'category_naturopathic/holistic', u'category_neurologist', u'category_newspapers_&_magazines', u'category_nightlife', u'category_notaries', u'category_nurseries_&_gardening', u'category_nutritionists', u'category_obstetricians_&_gynecologists', u'category_occupational_therapy', u'category_office_cleaning', u'category_office_equipment', u'category_officiants', u'category_oil_change_stations', u'category_oncologist', u'category_opera_&_ballet', u'category_ophthalmologists', u'category_optometrists', u'category_oral_surgeons', u'category_organic_stores', u'category_oriental', u'category_orthodontists', u'category_orthopedists', u'category_orthotics', u'category_osteopathic_physicians', u'category_outdoor_gear', 
u'category_outlet_stores', u'category_paddleboarding', u'category_paintball', u'category_painters', u'category_pakistani', u'category_parking', u'category_parks', u'category_party_&_event_planning', u'category_party_bus_rentals', u'category_party_equipment_rentals', u'category_party_supplies', u'category_pasta_shops', u'category_patisserie/cake_shop', u'category_pawn_shops', u'category_payroll_services', u'category_pediatric_dentists', u'category_pediatricians', u'category_performing_arts', u'category_periodontists', u'category_permanent_makeup', u'category_persian/iranian', u'category_personal_assistants', u'category_personal_chefs', u'category_personal_injury_law', u'category_personal_shopping', u'category_peruvian', u'category_pest_control', u'category_pet_adoption', u'category_pet_boarding/pet_sitting', u'category_pet_groomers', u'category_pet_services', u'category_pet_stores', u'category_pet_training', u'category_pets', u'category_pharmacy', u'category_photo_booth_rentals', u'category_photographers', u'category_photography_stores_&_services', u'category_physical_therapy', u'category_piano_bars', u'category_piano_services', u'category_piercing', u'category_pilates', u'category_pita', u'category_pizza', u'category_playgrounds', u'category_plumbing', u'category_plus_size_fashion', u'category_podiatrists', u'category_pole_dancing_classes', u'category_police_departments', u'category_polish', u'category_pool_&_hot_tub_service', u'category_pool_cleaners', u'category_pool_halls', u'category_pop_up_shops', u'category_portuguese', u'category_post_offices', u'category_poutineries', u'category_powder_coating', u'category_preschools', u'category_pressure_washers', u'category_pretzels', u'category_print_media', u'category_printing_services', u'category_private_investigation', u'category_private_tutors', u'category_professional_services', u'category_professional_sports_teams', u'category_propane', u'category_property_management', u'category_prosthetics', 
u'category_psychiatrists', u'category_psychics_&_astrologers', u'category_psychologists', u'category_pub_food', u'category_public_plazas', u'category_public_services_&_government', u'category_public_transportation', u'category_pubs', u'category_pulmonologist', u'category_rv_dealers', u'category_rv_parks', u'category_rv_rental', u'category_rv_repair', u'category_race_tracks', u'category_radio_stations', u'category_radiologists', u'category_rafting/kayaking', u'category_ramen', u'category_real_estate', u'category_real_estate_agents', u'category_real_estate_law', u'category_real_estate_services', u'category_recording_&_rehearsal_studios', u'category_recreation_centers', u'category_recycling_center', u'category_refinishing_services', u'category_reflexology', u'category_registration_services', u'category_rehabilitation_center', u'category_reiki', u'category_religious_organizations', u'category_religious_schools', u'category_resorts', u'category_restaurants', u'category_retirement_homes', u'category_rheumatologists', u'category_rock_climbing', u'category_rolfing', u'category_roofing', u'category_rugs', u'category_russian', u'category_salad', u'category_salvadoran', u'category_sandwiches', u'category_saunas', u'category_scandinavian', u'category_scottish', u'category_screen_printing', u'category_screen_printing/t_shirt_printing', u'category_scuba_diving', u'category_seafood', u'category_seafood_markets', u'category_security_services', u'category_security_systems', u'category_self_storage', u'category_septic_services', u'category_serbo_croatian', u'category_session_photography', u'category_sewing_&_alterations', u'category_shades_&_blinds', u'category_shanghainese', u'category_shared_office_spaces', u'category_shaved_ice', u'category_shipping_centers', u'category_shoe_repair', u'category_shoe_stores', u'category_shopping', u'category_shopping_centers', u'category_shredding_services', u'category_shutters', u'category_signmaking', u'category_singaporean', 
u'category_skate_parks', u'category_skating_rinks', u'category_ski_resorts', u'category_skin_care', u'category_skydiving', u'category_smog_check_stations', u'category_soccer', u'category_social_clubs', u'category_solar_installation', u'category_soul_food', u'category_soup', u'category_southern', u'category_souvenir_shops', u'category_spanish', u'category_special_education', u'category_specialty_food', u'category_specialty_schools', u'category_speech_therapists', u'category_sporting_goods', u'category_sports_bars', u'category_sports_clubs', u'category_sports_medicine', u'category_sports_wear', u'category_spray_tanning', u'category_stadiums_&_arenas', u'category_steakhouses', u'category_street_art', u'category_street_vendors', u'category_sugaring', u'category_summer_camps', u'category_surf_shop', u'category_surfing', u'category_surgeons', u'category_sushi_bars', u'category_swimming_lessons/schools', u'category_swimming_pools', u'category_swimwear', u'category_swiss_food', u'category_synagogues', u'category_szechuan', u'category_tai_chi', u'category_taiwanese', u'category_talent_agencies', u'category_tanning', u'category_tanning_beds', u'category_tapas_bars', u'category_tapas/small_plates', u'category_tattoo', u'category_tattoo_removal', u'category_tax_services', u'category_taxis', u'category_tea_rooms', u'category_telecommunications', u'category_television_service_providers', u'category_television_stations', u'category_tennis', u'category_teppanyaki', u'category_test_preparation', u'category_tex_mex', u'category_thai', u'category_thrift_stores', u'category_ticket_sales', u'category_tires', u'category_tobacco_shops', u'category_tours', u'category_towing', u'category_toy_stores', u'category_traditional_chinese_medicine', u'category_train_stations', u'category_trainers', u'category_trains', u'category_trampoline_parks', u'category_transportation', u'category_travel_services', u'category_tree_services', u'category_trinidadian', u'category_trophy_shops', 
u'category_truck_rental', u'category_turkish', u'category_tutoring_centers', u'category_ukrainian', u'category_uniforms', u'category_university_housing', u'category_urgent_care', u'category_urologists', u'category_used_bookstore', u'category_used,_vintage_&_consignment', u'category_utilities', u'category_uzbek', u'category_vacation_rental_agents', u'category_vacation_rentals', u'category_valet_services', u'category_vape_shops', u'category_vegan', u'category_vegetarian', u'category_venezuelan', u'category_venues_&_event_spaces', u'category_veterinarians', u'category_video_game_stores', u'category_video/film_production', u'category_videographers', u'category_videos_&_video_game_rental', u'category_vietnamese', u'category_vinyl_records', u'category_vocational_&_technical_school', u'category_walk_in_clinics', u'category_walking_tours', u'category_watch_repair', u'category_watches', u'category_water_delivery', u'category_waxing', u'category_web_design', u'category_wedding_planning', u'category_weight_loss_centers', u'category_wheel_&_rim_repair', u'category_wholesale_stores', u'category_wigs', u'category_window_washing', u'category_windows_installation', u'category_windshield_installation_&_repair', u'category_wine_bars', u'category_wine_tours', u'category_wineries', u'category_wok', u"category_women's_clothing", u'category_yelp_events', u'category_yoga', u'category_zoos', u'neighborhood_allentown', u"neighborhood_allied_dunn's_marsh", u'neighborhood_anthem', u'neighborhood_arboretum', u'neighborhood_aspinwall', u'neighborhood_avalon', u'neighborhood_ballantyne', u'neighborhood_banksville', u'neighborhood_bay_creek', u'neighborhood_beechview', u'neighborhood_bellevue', u'neighborhood_berkley_oaks', u'neighborhood_biddleville', u'neighborhood_bloomfield', u'neighborhood_bluff_acres', u'neighborhood_bon_air', u"neighborhood_bram's_addition", u'neighborhood_brighton_heights', u'neighborhood_brookline', u'neighborhood_bruntsfield', u'neighborhood_burke_heights', 
u'neighborhood_burr_oaks', u'neighborhood_cannonmills', u'neighborhood_capitol', u'neighborhood_capitol_view_heights', u'neighborhood_carnegie', u'neighborhood_carpenter_ridgeway', u'neighborhood_carrick', u'neighborhood_centennial', u'neighborhood_chinatown', u'neighborhood_cotswold', u'neighborhood_crafton_heights', u'neighborhood_derita', u'neighborhood_dilworth', u'neighborhood_dormont', u'neighborhood_downtown', u'neighborhood_dudgeon_monroe', u'neighborhood_duquesne_heights', u'neighborhood_east_carnegie', u'neighborhood_east_liberty', u'neighborhood_eastland', u'neighborhood_eastmorland', u'neighborhood_eastside', u'neighborhood_eken_park', u'neighborhood_elizabeth', u'neighborhood_elvehjem', u'neighborhood_emerson_east', u'neighborhood_etna', u'neighborhood_faircrest', u'neighborhood_fairywood', u'neighborhood_first_ward', u'neighborhood_fourth_ward', u'neighborhood_friendship', u'neighborhood_garfield', u'neighborhood_glacier_ridge', u'neighborhood_glen_oak_hills', u'neighborhood_glendale', u'neighborhood_grassmarket', u'neighborhood_greenbush', u'neighborhood_greenfield', u'neighborhood_greentree', u"neighborhood_hawk's_landing", u'neighborhood_hawthorne', u'neighborhood_haymarket', u'neighborhood_hays', u'neighborhood_hazelwood', u'neighborhood_heistand', u'neighborhood_high_crossing', u'neighborhood_highland_creek', u'neighborhood_highland_park', u'neighborhood_homestead', u'neighborhood_homewood', u'neighborhood_junction_ridge', u'neighborhood_knoxville', u'neighborhood_lake_edge', u'neighborhood_lake_view_hill', u'neighborhood_larimer', u'neighborhood_lawrenceville', u'neighborhood_leith', u'neighborhood_leopold', u'neighborhood_lincoln', u'neighborhood_maple___prairie', u'neighborhood_maple_wood', u'neighborhood_marbella', u'neighborhood_marchmont', u'neighborhood_mayfair_park', u'neighborhood_mcclellan_park', u'neighborhood_meadowood', u'neighborhood_midvale_heights_community', u'neighborhood_millvale', u'neighborhood_moorland___rimrock', 
u'neighborhood_morningside', u'neighborhood_mt__oliver', u'neighborhood_mt__washington', u'neighborhood_myers_park', u'neighborhood_new_town', u'neighborhood_newington', u'neighborhood_noda', u'neighborhood_nobel_park', u'neighborhood_norman_acres', u'neighborhood_north_charlotte', u'neighborhood_north_side', u'neighborhood_northwest', u'neighborhood_oakbridge_community', u'neighborhood_oakland', u'neighborhood_observatory_hill', u'neighborhood_old_middleton_greenway', u'neighborhood_old_town', u'neighborhood_orchard_ridge_community', u'neighborhood_overbrook', u'neighborhood_paw_creek', u'neighborhood_plaza_midwood', u'neighborhood_point_breeze', u'neighborhood_polish_hill', u'neighborhood_quail_hollow', u'neighborhood_regent', u'neighborhood_regent_square', u'neighborhood_ridgewood', u'neighborhood_rolling_meadows', u'neighborhood_royal_mile', u'neighborhood_sauk_creek', u'neighborhood_schenk___atwood', u'neighborhood_sedgefield', u'neighborhood_shadyside', u'neighborhood_sharpsburg', u'neighborhood_sheraden', u'neighborhood_sherman', u'neighborhood_sherwood_forest', u'neighborhood_south_campus', u'neighborhood_south_end', u'neighborhood_south_park', u'neighborhood_south_side', u'neighborhood_south_side_slopes', u'neighborhood_south_summerlin', u'neighborhood_southeast', u'neighborhood_southwest', u'neighborhood_spring_harbor', u'neighborhood_spring_valley', u'neighborhood_squirrel_hill', u'neighborhood_stanton_heights', u'neighborhood_starkweather___yahar', u'neighborhood_starmount', u'neighborhood_steele_creek', u'neighborhood_stockbridge', u'neighborhood_stone_meadows', u'neighborhood_strip_district', u'neighborhood_summerlin', u'neighborhood_summit_woods', u'neighborhood_sunrise', u'neighborhood_sunset_village', u'neighborhood_tenney___lapham', u'neighborhood_the_hill_district', u'neighborhood_the_lakes', u'neighborhood_the_meadows', u'neighborhood_the_strip', u'neighborhood_third_ward', u'neighborhood_tollcross', u'neighborhood_troy_hill', 
u'neighborhood_university', u'neighborhood_university_city', u'neighborhood_uptown', u'neighborhood_vilas', u'neighborhood_walnut_grove', u'neighborhood_waunona', u'neighborhood_west_end', u'neighborhood_west_view', u'neighborhood_westchester_gardens', u'neighborhood_westhaven_trails', u'neighborhood_westmorland', u'neighborhood_westside', u'neighborhood_wexford', u'neighborhood_williamson___marquette', u'neighborhood_willy_st', u'neighborhood_windgap', u'neighborhood_worthington_park', u'hour_friday_close', u'hour_friday_open', u'hour_monday_close', u'hour_monday_open', u'hour_saturday_close', u'hour_saturday_open', u'hour_sunday_close', u'hour_sunday_open', u'hour_thursday_close', u'hour_thursday_open', u'hour_tuesday_close', u'hour_tuesday_open', u'hour_wednesday_close', u'hour_wednesday_open', u'neighborhoods_count']

In [213]:
# World map in cylindrical ('cyl') projection covering the full lat/lon range,
# with one translucent red marker per business.
fig = plt.figure(figsize=(18, 12))
m = bm.Basemap(
    projection='cyl',
    llcrnrlat=-90, urcrnrlat=90,
    llcrnrlon=-180, urcrnrlon=180,
    resolution='c'
)

# Base layers: country borders, land/lake fill and the map background.
m.drawcountries(linewidth=0.2)
m.fillcontinents(color='lavender', lake_color='#000040')
m.drawmapboundary(linewidth=0.2, fill_color='#000040')

# Grid lines every 30 degrees; both calls share the same styling and have
# every entry of `labels` set to 0.
grid_style = dict(labels=[0, 0, 0, 0], color='white', linewidth=0.5)
m.drawparallels(np.arange(-90, 90, 30), **grid_style)
m.drawmeridians(np.arange(0, 360, 30), **grid_style)

# latlon=True: the coordinates are passed as longitude/latitude in degrees.
m.plot(
    df_businesses['longitude'], df_businesses['latitude'], 'o',
    markersize=20, latlon=True, color='red', alpha=0.5, label="Business"
)

plt.title("Geo distribution of businesses")
# White legend background so the entry stays readable over the dark map.
business_legend = plt.legend(frameon=1)
business_legend.get_frame().set_facecolor("white")
plt.show()


Большинство предприятий находится в США; часть — в Канаде, Германии и Великобритании.


In [196]:
# Number of businesses per state, ordered from the most to the fewest.
# sort_values() is chained rather than called with inplace=True, so the
# sorted Series is produced in a single expression without mutating an
# intermediate object.
states_dist = (
    df_businesses
    .groupby('state')
    .size()
    .sort_values(ascending=False)
)
states_dist.plot(kind='bar', figsize=(16, 6), fontsize=13, title='Businesses distribution over states')
plt.xticks(rotation=0)
# Binding the label objects to a name keeps their repr out of the cell output.
lbls = plt.xlabel('State'), plt.ylabel('Count')


Большинство предприятий в Аризоне (AZ) и Неваде (NV). Не меньше тысячи в Северной Каролине (NC), Квебеке (QC, Канада), Пенсильвании (PA), Эдинбурге (EDH, Шотландия) и Висконсине (WI).


In [109]:
# Share of businesses for each value of the 'open' column, drawn as a pie chart.
open_dist = df_businesses.groupby('open').size()
# explode has one entry per wedge, so exactly two groups are expected.
open_dist.plot.pie(
    figsize=(7, 7),
    fontsize=13,
    title='Open?',
    autopct='%1.1f%%',
    legend=True,
    explode=(0.05, 0)
)


Out[109]:
<matplotlib.axes._subplots.AxesSubplot at 0x22e1b1e50>

12% предприятий не работают :(


In [110]:
# Peek at a single row to see the column layout of the users table.
df_users.head(1)


Out[110]:
user_id name friends_count fans review_count average_stars yelping_since compliment_cool compliment_cute compliment_funny ... elite_at_2009 elite_at_2010 elite_at_2011 elite_at_2012 elite_at_2013 elite_at_2014 elite_at_2015 friends elite_total was_elite
0 18kPq7GPye-YQ3LyKyAZPw Russel 206 69 108 4.14 2004-10 78 15 11 ... 0 0 0 0 0 0 0 rpOyqD_893cqmDAtJLbdog,4U9kSBLuBDU391x6bxU-YA,... 2 True

1 rows × 35 columns


In [111]:
# List every column name of the users table. print() with a single argument
# behaves the same on Python 2 and Python 3, whereas the bare print
# statement is a SyntaxError on Python 3.
print(df_users.columns.tolist())


[u'user_id', u'name', u'friends_count', u'fans', u'review_count', u'average_stars', u'yelping_since', u'compliment_cool', u'compliment_cute', u'compliment_funny', u'compliment_hot', u'compliment_list', u'compliment_more', u'compliment_note', u'compliment_photos', u'compliment_plain', u'compliment_profile', u'compliment_writer', u'vote_cool', u'vote_funny', u'vote_useful', u'elite_at_2005', u'elite_at_2006', u'elite_at_2007', u'elite_at_2008', u'elite_at_2009', u'elite_at_2010', u'elite_at_2011', u'elite_at_2012', u'elite_at_2013', u'elite_at_2014', u'elite_at_2015', u'friends', 'elite_total', 'was_elite']

In [217]:
# Total per user: row-wise sum of the elite_at_2005 ... elite_at_2015 columns,
# stored as an integer column on df_users.
elite_year_cols = [u'elite_at_%d' % year for year in range(2005, 2016)]
elite_years_sum = df_users[elite_year_cols].sum(axis=1)
df_users['elite_total'] = elite_years_sum.values.astype(int)

# Number of users for each total; the y axis is logarithmic (logy=True).
elite_total_dist = df_users.groupby('elite_total').size()
ax = elite_total_dist.plot.bar(
    figsize=(16, 6),
    logy=True,
    fontsize=13,
    title='Users distribution over the number of elite years'
)
plt.xticks(rotation=0)
# Binding the label objects to a name keeps their repr out of the cell output.
lbls = (plt.xlabel('Elite Years'), plt.ylabel('Count'))


Логарифмическая шкала, чтобы заметить элитных пользователей


In [215]:
# Flag users whose 'elite_total' is positive. The vectorised comparison
# produces the same boolean column as a row-wise apply(lambda ...) without
# calling a Python function for every row.
# Relies on the 'elite_total' column already being present in df_users.
df_users['was_elite'] = df_users['elite_total'] > 0
was_elite_dist = df_users.groupby('was_elite').size()
# explode has one entry per wedge, so both the True and the False group
# are expected to be present.
was_elite_dist.plot(kind='pie', figsize=(7, 7), fontsize=13, title='Was Elite?', autopct='%1.1f%%', legend=True, explode=(0.05, 0))


Out[215]:
<matplotlib.axes._subplots.AxesSubplot at 0x21dc3c950>

Только 7% пользователей были элитными


In [197]:
# Number of users per 'yelping_since' value, one bar per distinct value.
yelping_since_dist = df_users.groupby('yelping_since').size()
ax = yelping_since_dist.plot.bar(figsize=(16, 6), fontsize=13, title='User registration dynamic')
lbls = (plt.xlabel('Year'), plt.ylabel('Count'))

# Thin out the x ticks: keep every 12th tick starting at index 3 and show only
# the first four characters of its label.
# NOTE(review): presumably labels look like 'YYYY-MM' with the series starting
# in October, so index 3 is a January -- confirm against the data.
locs, labels = plt.xticks()
year_labels = [tick.get_text()[:4] for tick in labels]
xtks = plt.xticks(locs[3::12], year_labels[3::12], fontsize=13, rotation=45)


Пик притока новых пользователей приходится на 2011 год. В конце 2014 года наблюдается спад.


In [ ]:


In [ ]:


In [ ]: