In [1]:
library(SparkR)
In [2]:
# Start the Spark context against the "local[*]" master and request the
# spark-csv package, which the CSV read further down names as its source.
sc <- sparkR.init(
  master = "local[*]",
  appName = "SparkR",
  sparkPackages = "com.databricks:spark-csv_2.10:1.5.0"
)

# SQL context derived from the Spark context; every DataFrame / SQL call
# below takes it as the first argument.
sqlContext <- sparkRSQL.init(sc)
In [3]:
# Explicit column layout for the points data: a string tag followed by
# two double-valued columns named x and y.
schema <- structType(
  structField("tag", "string"),
  structField("x", "double"),
  structField("y", "double")
)
In [4]:
# Read /opt/points.txt through the spark-csv data source, applying the
# explicit schema defined earlier instead of relying on inference.
points <- read.df(
  sqlContext,
  path = "/opt/points.txt",
  source = "com.databricks.spark.csv",
  schema = schema
)

# collect() brings the rows back as a local R data.frame, which is printed.
print(collect(points))
In [5]:
# Make the DataFrame addressable from SQL under the table name "points".
registerTempTable(points, "points")

# NOTE(review): POINT(...) IN CIRCLERANGE(...) is not stock Spark SQL; it is
# presumably supplied by a spatial extension of the Spark build in use, and
# presumably keeps rows whose (x, y) lies within distance 2 of (4.5, 4.5).
# TODO confirm against that extension's documentation.
#
# The string is stored in a variable called `sql`, the same name as SparkR's
# sql() function. The call below still resolves to the function because R
# skips non-function bindings when looking up a name in call position.
sql <- "SELECT * FROM points WHERE POINT(x, y) IN CIRCLERANGE(POINT(4.5, 4.5), 2)"

# Run the query, collect the result locally and print it.
print(collect(sql(sqlContext, sql)))
In [ ]: