Spark Python 例子

来源:互联网 发布:出知益州 时李顺构乱 编辑:程序博客网 时间:2024/06/06 01:07
# -*- coding: utf-8 -*-
"""Word-count example for PySpark.

Reads a text file, splits every line on single spaces, counts how often each
resulting token occurs, and prints one line per distinct token.

Example invocation:
    ./pyspark /home/yunshouhu/PycharmProjects/untitled/word.py /home/yunshouhu/PycharmProjects/untitled/data.txt
"""
from __future__ import print_function

import sys
from operator import add

from pyspark import SparkContext


def main(argv):
    """Run the word-count job described by the command-line arguments.

    Args:
        argv: Full argument vector (as in ``sys.argv``); ``argv[1]`` is the
            path of the text file to count words in.

    Raises:
        SystemExit: With status -1 when the argument count is not exactly
            one file path after the script name.
    """
    if len(argv) != 2:
        print("Usage: word <file>", file=sys.stderr)
        # sys.exit instead of the bare ``exit`` helper, which is only
        # injected by the ``site`` module for interactive sessions.
        sys.exit(-1)

    sc = SparkContext(appName="myword")
    try:
        # The second argument is the minimum number of partitions.
        lines = sc.textFile(argv[1], 1)

        # NOTE: split(' ') splits on each single space, so consecutive
        # spaces yield empty-string tokens that are counted like any word.
        counts = (
            lines.flatMap(lambda line: line.split(' '))
            .map(lambda token: (token, 1))
            .reduceByKey(add)
        )

        # collect() returns every (word, count) pair to the driver.
        output = counts.collect()
        for (word, count) in output:
            print("来自中国: %s %i" % (word, count))
    finally:
        # Always stop the context, even when the job fails part-way.
        sc.stop()


if __name__ == "__main__":
    main(sys.argv)

0 0