In [1]:
from vega_datasets import data
# Load the movies sample dataset, then preview its first five rows; the bare
# last expression is what the notebook renders as this cell's output.
movies_data = data.movies()
movies_data.head(n=5)


Out[1]:
Title US_Gross Worldwide_Gross US_DVD_Sales Production_Budget Release_Date MPAA_Rating Running_Time_min Distributor Source Major_Genre Creative_Type Director Rotten_Tomatoes_Rating IMDB_Rating IMDB_Votes
0 The Land Girls 146083.0 146083.0 NaN 8000000.0 Jun 12 1998 R NaN Gramercy None None None None NaN 6.1 1071.0
1 First Love, Last Rites 10876.0 10876.0 NaN 300000.0 Aug 07 1998 R NaN Strand None Drama None None NaN 6.9 207.0
2 I Married a Strange Person 203134.0 203134.0 NaN 250000.0 Aug 28 1998 None NaN Lionsgate None Comedy None None NaN 6.8 865.0
3 Let's Talk About Sex 373615.0 373615.0 NaN 300000.0 Sep 11 1998 None NaN Fine Line None Comedy None None 13.0 NaN NaN
4 Slam 1009819.0 1087521.0 NaN 1000000.0 Oct 09 1998 R NaN Trimark Original Screenplay Drama Contemporary Fiction None 62.0 3.4 165.0

In [45]:
import matplotlib.pyplot as plt
import seaborn as sns
from vega_datasets import data

# Loaded inside this cell as well, so the plot does not rely on kernel state
# left behind by an earlier cell.
movies_data = data.movies()

# Use an explicit Figure/Axes pair instead of the implicit pyplot "current
# axes", so every call below targets this plot and nothing else.
fig, ax = plt.subplots()
sns.scatterplot(
    x="Production_Budget",
    y="US_DVD_Sales",
    hue="Major_Genre",
    data=movies_data,
    ax=ax,
)
ax.set_title("Production Budget Vs. US DVD Sales - Genre")
ax.set_xlabel("Production Budget")
ax.set_ylabel("US DVD Sales")

# The hue legend has one entry per genre; anchor it just outside the right
# edge of the axes so it cannot sit on top of the data points.
ax.legend(
    title="Major_Genre",
    loc="upper left",
    bbox_to_anchor=(1.02, 1),
    borderaxespad=0,
)
# Re-fit the layout so the externally placed legend is not clipped.
fig.tight_layout()
plt.show()



In [0]: