In [1]:
:extension DeriveGeneric
:extension FlexibleContexts
:extension OverloadedStrings
:extension GeneralizedNewtypeDeriving
:extension FlexibleInstances
:extension MultiParamTypeClasses
In [2]:
import GHC.Generics (Generic)
import Spark.Core.Dataset
import Spark.Core.Context
import Spark.Core.Functions
import Spark.Core.Column
import Spark.Core.Types
import Spark.Core.Row
import Spark.Core.ColumnFunctions
-- Session settings: start from defaultConf and override only the endpoint and
-- the requested session name. The Python cells further down connect using the
-- same session name ("session05_python").
conf = defaultConf
  { confEndPoint = "http://10.0.2.2"
  , confRequestedSessionName = "session05_python"
  }
-- Create the session from the settings above.
-- NOTE(review): presumably this registers the default session that the later
-- exec1Def call relies on -- confirm against Spark.Core.Context.
createSparkSessionDef conf
In [3]:
import Spark.Core.Types
In [4]:
-- Example record with two Int fields; values of this type are the elements of
-- the list that gets turned into a dataset in the following cell.
data MyData = MyData
  { aBigId        :: Int
  , importantData :: Int
  } deriving (Eq, Ord, Show, Generic)

-- The instance bodies are intentionally empty, so every method comes from the
-- class defaults.
-- NOTE(review): presumably those defaults are derived through Generic -- confirm.
instance SQLTypeable MyData
instance FromSQL MyData
instance ToSQL MyData
In [5]:
-- Three sample MyData values used as the input data.
let collection = [MyData 1 2, MyData 3 2, MyData 5 4]
-- Build a dataset from the list and tag it with the string "dataset" via (@@).
-- NOTE(review): presumably (@@) assigns the node name -- confirm.
let ds = dataset collection @@ "dataset"
-- Collect the dataset (viewed as a column) and tag the result "collected_data";
-- the Python cells below look it up by that same string.
let c = collect (asCol ds) @@ "collected_data"
-- Execute the collect; the result is bound to _ and therefore discarded here.
_ <- exec1Def c
In [2]:
from kraps import *
# Connect to the session with the same name the Haskell cells requested
# ("session05_python").
# NOTE(review): the Haskell configuration points at http://10.0.2.2 while this
# call uses 'localhost' -- presumably the same server seen from two different
# hosts; confirm for your setup.
ks = connectSession("session05_python", address='localhost')
# Bare expression so the notebook displays the session object.
ks
In [ ]:
# Look up "collected_data" -- the name attached to the collect in the Haskell
# cell -- through the session.
# NOTE(review): presumably this returns the result as a pandas object; confirm
# against the kraps package.
ks.pandas("collected_data")
In [ ]:
# Print the URL the session reports for "collected_data".
# The function-call form of print is used because the Python 2 print statement
# is a SyntaxError on Python 3; with a single argument the call form prints the
# same text on Python 2 as well.
print(ks.url('collected_data'))
In [ ]: