In [1]:
# Register the local archive 'magichour.zip' with `sc` through addPyFile so the
# `magichour` package can be imported by the cells that follow.
# NOTE(review): `sc` is not defined anywhere in this notebook — presumably the
# SparkContext injected by the PySpark kernel/shell; confirm before running on
# a plain Python kernel. The relative path also assumes the zip sits in the
# notebook's working directory — TODO confirm.
sc.addPyFile('magichour.zip')
In [2]:
from magichour.api.dist.templates.templateEval import templateEvalRDD
In [3]:
# Job configuration: HDFS locations consumed by the templateEvalRDD call and
# by the save step further down.
# NOTE(review): the 'namenode' host is hard-coded in every URI; adjust for the
# target cluster.

# Passed as the third argument to templateEvalRDD.
transformURI = 'hdfs://namenode/magichour/simpleTrans'
# Passed as the fourth argument to templateEvalRDD.
templateURI = 'hdfs://namenode/magichour/templates'
# Input log file (gzip-compressed, judging by the .gz suffix); second argument
# to templateEvalRDD.
logInURI = 'hdfs://namenode/magichour/tbird.500k.gz'
# Destination handed to saveAsPickleFile.
# NOTE(review): the input is named 'tbird.500k' but this output is named
# 'tbird.500' — confirm whether the missing 'k' is intentional.
logOUTURI = 'hdfs://namenode/magichour/tbird.500.templateEvalRDD'
In [4]:
# Run magichour's templateEvalRDD over the input log, giving it `sc`, the log
# URI, the transform URI and the template URI (in that order), and keep the
# result as `test`.
# NOTE(review): later cells call saveAsPickleFile() and take() on `test`, so it
# is presumably a Spark RDD; if so this line is likely lazy and the real work
# happens in those later actions — confirm against templateEvalRDD's source.
test = templateEvalRDD(sc,logInURI,transformURI,templateURI)
In [5]:
# Persist the evaluated result to logOUTURI in pickle form.
# NOTE(review): Spark output writers normally refuse to write to a path that
# already exists, so re-running this cell (or the whole notebook) will
# presumably fail until the previous output is removed — confirm.
test.saveAsPickleFile(logOUTURI)
In [ ]:
# Sanity check: show the first 10 elements of `test` as the cell output.
# This cell has no execution count in the saved notebook, i.e. it had not been
# run when the notebook was saved.
# NOTE(review): unless `test` is cached, this presumably recomputes the whole
# pipeline a second time after the save step — confirm, and consider caching.
test.take(10)
In [ ]: