In [1]:
from pyspark.sql import Row
In [2]:
# Load the points file and parse every line into a Row(tag, x, y).
# Assumes each line has the form "tag,x,y" -- TODO confirm against /opt/points.txt.
points = (
    sc.textFile("/opt/points.txt")
    .map(lambda line: line.split(","))
    # Fix: y is read from the third field (index 2). It was previously read
    # from index 1, which made every point's y identical to its x.
    .map(lambda p: Row(tag=p[0], x=float(p[1]), y=float(p[2])))
)
In [3]:
# Convert the RDD of Row objects into a DataFrame and rebind `points` to it,
# so the following cells operate on the DataFrame rather than the RDD.
# NOTE(review): because the name is rebound, re-running this cell alone calls
# toDF() on a DataFrame rather than the original RDD -- re-run the load cell first.
points = points.toDF()
# Print a preview of the DataFrame to sanity-check the parsed columns.
points.show()
In [4]:
# Expose the DataFrame to SQL under the table name "points".
points.registerTempTable("points")

# Select every point within distance 2 of (4.5, 4.5).
# NOTE(review): POINT / CIRCLERANGE are not standard Spark SQL; presumably they
# come from a spatial extension loaded into this sqlContext -- confirm.
sql = (
    "SELECT * FROM points "
    "WHERE POINT(x, y) IN CIRCLERANGE(POINT(4.5, 4.5), 2)"
)

# Run the query and print the matching rows.
sqlContext.sql(sql).show()
In [ ]: