Spark入门

安装:https://www.jianshu.com/p/0f4cc9ecc14c

第一个项目:Word Count

import org.apache.spark.{SparkConf, SparkContext}

/**
 * Minimal Spark word-count example.
 *
 * Reads `test.txt`, splits every line on single spaces, counts the occurrences
 * of each non-empty token, prints the counts to stdout and saves them as text
 * under an output path named `FILE_NAME` followed by the current timestamp.
 */
object SparkWordCount {
  /** Prefix of the output path; `main` appends `System.currentTimeMillis()` to it. */
  def FILE_NAME: String = "word_count_results_"

  /**
   * Runs the word-count job with the master set to "local".
   *
   * @param args command-line arguments (unused)
   */
  def main(args: Array[String]): Unit = {
    val conf = new SparkConf().setAppName("Demo").setMaster("local")
    val sc = new SparkContext(conf)
    try {
      val wordCounts = sc.textFile("test.txt")
        .flatMap(_.split(" "))
        // Blank lines and leading/repeated spaces produce empty tokens; do not count them as words.
        .filter(_.nonEmpty)
        .map(word => (word, 1))
        .reduceByKey(_ + _)
        // The result feeds two actions (collect and saveAsTextFile); cache it so it is computed once.
        .cache()

      println("Word Count program running results:")
      wordCounts.collect().foreach { case (word, count) =>
        println(s"$word=$count")
      }

      wordCounts.saveAsTextFile(FILE_NAME + System.currentTimeMillis())
      println("Word Count program running results are successfully saved.")
    } finally {
      // Always release the SparkContext, even when the job fails part-way.
      sc.stop()
    }
  }
}

最后编辑于
©著作权归作者所有,转载或内容合作请联系作者
平台声明:文章内容(如有图片或视频亦包括在内)由作者上传并发布,文章内容仅代表作者本人观点,简书系信息发布平台,仅提供信息存储服务。