Scala 的 WordCount 示例

import org.apache.spark.{SparkConf, SparkContext}
import org.apache.spark.sql.SparkSession

/** Spark word-count job: counts the whitespace-separated words of a text file and prints
  * each word followed by its number of occurrences.
  *
  * Usage: `WordCount [inputPath]`. When no path is given on the command line, the
  * default location `file:/D:/data/test` is read.
  */
object WordCount {

  /** Input location used when no path is passed on the command line. */
  private val DefaultInputPath = "file:/D:/data/test"

  /** Entry point: builds the Spark context, runs the count, and prints the result.
    *
    * @param args optional command-line arguments; `args(0)`, if present, is the input path
    */
  def main(args: Array[String]): Unit = {
    val inputPath = args.headOption.getOrElse(DefaultInputPath)

    val conf = new SparkConf()
      .setAppName("WordCount")
      // Fall back to local mode only when no master was supplied (e.g. by spark-submit),
      // so launching directly from an IDE does not fail with a missing master URL.
      .setIfMissing("spark.master", "local[*]")
    val sc = new SparkContext(conf)

    try {
      val counts = sc
        .textFile(inputPath)
        // Split on runs of whitespace and drop empty tokens so that consecutive or
        // leading spaces are not counted as a word.
        .flatMap(line => line.split("\\s+").filter(_.nonEmpty))
        .map(word => (word, 1))
        .reduceByKey(_ + _)

      // Bring the results to the driver before printing: RDD.foreach runs on the
      // executors, so on a cluster its println output would not reach the driver console.
      // NOTE(review): collect() materializes every distinct word on the driver; for very
      // large vocabularies prefer take(n) or saveAsTextFile.
      counts.collect().foreach { case (word, count) => println(s"$word $count") }
    } finally {
      // Release the context even when the job fails.
      sc.stop()
    }
  }
}
原文地址:https://www.cnblogs.com/timlong/p/10002305.html