def main():
    """Run the Yelp recommendation job end to end.

    Steps, in order:

    1. Start a local Spark context (two worker threads, app name
       ``YelpRecommender``).
    2. Load records via ``readElasticSearch`` and keep those accepted by
       ``location_recommender``.
    3. Take the 150 records with the highest ``stars`` value, then reduce
       them with ``copyUniqueData(..., 5)``.
    4. Print the result, clear the Elasticsearch target with
       ``clearElasticSearch``, and write the remapped records to the
       ``yelpreco/resturant`` resource.

    The Spark context is always stopped before returning, including when a
    step raises, so a failed run does not leave a live context behind.
    """
    conf = SparkConf().setMaster("local[2]").setAppName("YelpRecommender")
    sc = SparkContext(conf=conf)
    try:
        rdd_data = readElasticSearch(sc)
        parsed_mapped_data = rdd_data.filter(location_recommender)

        # Each record is indexed as a[1]["stars"]; presumably a
        # (doc_id, document) pair -- verify against readElasticSearch.
        # top() returns a plain list on the driver, highest stars first.
        sorted_data = parsed_mapped_data.top(150, key=lambda a: a[1]["stars"])

        # NOTE(review): presumably de-duplicates and keeps 5 entries --
        # confirm against copyUniqueData.
        topn_data = copyUniqueData(sorted_data, 5)
        printResult(topn_data)

        # Clear the target before writing the fresh results.
        clearElasticSearch()

        # The selection is a driver-side list; turn it back into an RDD so
        # it can be written through the Hadoop output format.
        sorted_rdd = sc.parallelize(topn_data)
        es_data = sorted_rdd.map(remap_es)

        # NOTE(review): "resturant" is spelled as in the existing resource
        # name; do not "correct" it without migrating the index.
        es_data.saveAsNewAPIHadoopFile(
            path='-',
            outputFormatClass="org.elasticsearch.hadoop.mr.EsOutputFormat",
            keyClass="org.apache.hadoop.io.NullWritable",
            valueClass="org.elasticsearch.hadoop.mr.LinkedMapWritable",
            conf={"es.resource": "yelpreco/resturant"},
        )
    finally:
        # Release the context even if any step above fails.
        sc.stop()
recommender.py 文件源码
python
阅读 28
收藏 0
点赞 0
评论 0
评论列表
文章目录