本文最后更新于 2021-08-05 11:42:59
word-count
添加依赖
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
<!-- Fragment to merge into the <project> element of pom.xml. -->

<!-- Spark core library; the "_2.11" suffix selects the build for Scala 2.11. -->
<dependencies>
    <dependency>
        <groupId>org.apache.spark</groupId>
        <artifactId>spark-core_2.11</artifactId>
        <version>2.1.1</version>
    </dependency>
</dependencies>

<build>
    <plugins>
        <!-- Lets Maven compile the Scala main and test sources. -->
        <plugin>
            <groupId>net.alchim31.maven</groupId>
            <artifactId>scala-maven-plugin</artifactId>
            <version>3.4.6</version>
            <executions>
                <execution>
                    <goals>
                        <goal>compile</goal>
                        <goal>testCompile</goal>
                    </goals>
                </execution>
            </executions>
        </plugin>
    </plugins>
</build>
|
scala
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
/**
 * Minimal Spark word-count job.
 *
 * Reads the text file whose path is given as the first program argument, splits every line
 * into whitespace-separated words, counts how often each word occurs and prints the resulting
 * `(word, count)` pairs to standard output.
 *
 * Requires `org.apache.spark.SparkConf` and `org.apache.spark.SparkContext` to be imported.
 */
object Hello {

  /**
   * Program entry point.
   *
   * @param args command-line arguments; `args(0)` is the path of the input text file
   */
  def main(args: Array[String]): Unit = {
    // Fail with a usage message instead of an ArrayIndexOutOfBoundsException on args(0).
    if (args.isEmpty) {
      System.err.println("Usage: Hello <input-path>")
      sys.exit(1)
    }

    val conf = new SparkConf().setMaster("local[2]").setAppName("Hello")
    val sc = new SparkContext(conf)

    // Always release the context, even when the job itself fails.
    try {
      val lineRDD = sc.textFile(args(0))

      val resultRDD = lineRDD
        // Split on runs of whitespace and drop empty tokens so that blank lines and
        // repeated/leading spaces are not counted as the word "".
        .flatMap(_.split("\\s+"))
        .filter(_.nonEmpty)
        .map((_, 1))
        .reduceByKey(_ + _)

      val wordCounts = resultRDD.collect()
      wordCounts.foreach(println)
    } finally {
      sc.stop()
    }
  }
}
|
05word-count
https://jiajun.xyz/2021/07/10/bigdata/10spark/05word-count/