We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 7bcccc9, commit 43f7883 (Copy full SHA for 43f7883)
pairRdd/aggregation/reducebykey/WordCount.py
@@ -0,0 +1,14 @@
1
+from pyspark import SparkContext
2
+
3
if __name__ == "__main__":
    # Word count over a text file using a pair RDD and reduceByKey.
    #
    # Reads "in/word_count.text", splits each line into words, counts the
    # occurrences of every distinct word, and prints one "word : count"
    # line per word to stdout.

    # "local" runs Spark in-process; "wordCounts" is the application name.
    sc = SparkContext("local", "wordCounts")
    try:
        # Keep Spark's own logging down to errors so the output stays readable.
        sc.setLogLevel("ERROR")

        lines = sc.textFile("in/word_count.text")

        # str.split() with no separator splits on any whitespace run and
        # never yields empty strings, so blank lines and repeated spaces do
        # not get counted as an empty "word" (split(" ") would emit "").
        wordRdd = lines.flatMap(lambda line: line.split())

        # Pair every word with an initial count of 1 ...
        wordPairRdd = wordRdd.map(lambda word: (word, 1))

        # ... and sum the counts per distinct word.
        wordCounts = wordPairRdd.reduceByKey(lambda x, y: x + y)

        # collect() brings all (word, count) pairs back to the driver.
        for word, count in wordCounts.collect():
            print("{} : {}".format(word, count))
    finally:
        # Always release the SparkContext, even if the job fails part-way.
        sc.stop()
0 commit comments