notebook.community

Edit and run



In [1]:

    
import spark_jupyter



In [2]:

    
from pyspark import SparkConf, SparkContext, SQLContext

# Reuse the already-running SparkContext when this cell is executed again.
# Calling the SparkContext constructor a second time in the same kernel raises
# "Cannot run multiple SparkContexts at once"; getOrCreate makes the cell
# safe to re-run. The configuration is only applied when a new context is
# actually created.
sc = SparkContext.getOrCreate(
    SparkConf().setMaster("local[*]").setAppName("Simple App")
)

# SQL entry point bound to the context above; later cells use it as `hc`.
hc = SQLContext(sc)



In [3]:

    
# Build a small two-row demo DataFrame with columns A, B and C.
df = hc.createDataFrame(
    [
        ['a', 'b', 'c'],
        ['e', 'f', 'g'],
    ],
    schema=['A', 'B', 'C'],
)

# Render the rows of the DataFrame.
df.show()



In [4]:

    
# Display the schema of `df`: each column's name, type and nullability.
df.printSchema()

Name	Type	Nullable
A	string	✓
B	string	✓
C	string	✓