热门标签 | HotTags
当前位置:  开发笔记 > 编程语言 > 正文

Spark 入门:WordCount(Java 版)

wordcount-java:pom.xml 文件如下:junit:junit:3.8.1(test)、org.apache.spark:spark-core_2.10:1.3.0 ……

wordcount-java:

pom.xml文件如下:

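<dependencies>
  <dependency>
    <groupId>junit</groupId>
    <artifactId>junit</artifactId>
    <version>3.8.1</version>
    <scope>test</scope>
  </dependency>
  <dependency>
    <groupId>org.apache.spark</groupId>
    <artifactId>spark-core_2.10</artifactId>
    <version>1.3.0</version>
  </dependency>
  <dependency>
    <groupId>org.apache.spark</groupId>
    <artifactId>spark-sql_2.10</artifactId>
    <version>1.3.0</version>
  </dependency>
  <dependency>
    <groupId>org.apache.spark</groupId>
    <artifactId>spark-hive_2.10</artifactId>
    <version>1.3.0</version>
  </dependency>
  <dependency>
    <groupId>org.apache.spark</groupId>
    <artifactId>spark-streaming_2.10</artifactId>
    <version>1.3.0</version>
  </dependency>
  <dependency>
    <groupId>org.apache.hadoop</groupId>
    <artifactId>hadoop-client</artifactId>
    <version>2.4.1</version>
  </dependency>
  <dependency>
    <groupId>org.apache.spark</groupId>
    <artifactId>spark-streaming-kafka_2.10</artifactId>
    <version>1.3.0</version>
  </dependency>
</dependencies>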

package cn.spark.study.core;

import java.util.Arrays;

import org.apache.spark.SparkConf;

import org.apache.spark.api.java.JavaPairRDD;

import org.apache.spark.api.java.JavaRDD;

import org.apache.spark.api.java.JavaSparkContext;

import org.apache.spark.api.java.function.FlatMapFunction;

import org.apache.spark.api.java.function.Function2;

import org.apache.spark.api.java.function.PairFunction;

import org.apache.spark.api.java.function.VoidFunction;

import scala.Tuple2;

public class WordCount3 {

public static void main(String[] args) {

SparkConf cOnf=new SparkConf().setAppName("WorldCountLocal").setMaster("local");

JavaSparkContext sc=new JavaSparkContext(conf);

JavaRDD lines=sc.textFile("C:\\Users\\wanglonglong\\Desktop\\word.txt");

JavaRDD words=lines.flatMap(new FlatMapFunction() {

@Override

public Iterable call(String t) throws Exception {

// TODO Auto-generated method stub

return Arrays.asList(t.split(" "));

}

});

JavaPairRDD pairs = words.mapToPair(new PairFunction() {

private static final long serialVersiOnUID=1;

@Override

public Tuple2 call(String word) throws Exception {

return new Tuple2(word,1);

}

});

JavaPairRDD wordCounts = pairs.reduceByKey(

new Function2() {

private static final long serialVersiOnUID= 1L;

public Integer call(Integer v1, Integer v2) throws Exception {

return v1 + v2;

}

});

wordCounts.foreach(new VoidFunction>() {

private static final long serialVersiOnUID= 1L;

public void call(Tuple2 wordCount) throws Exception {

System.out.println("("+wordCount._1 + "," + wordCount._2 + " )");

}

});

sc.close();

}

}

332622d2c16076dd9edee338184ed060.png

7055747f20ecc3fa74918e7d198eb2da.png



推荐阅读
author-avatar
爱与嫉妒咋
这个家伙很懒,什么也没留下!
PHP1.CN | 中国最专业的PHP中文社区 | DevBox开发工具箱 | json解析格式化 |PHP资讯 | PHP教程 | 数据库技术 | 服务器技术 | 前端开发技术 | PHP框架 | 开发工具 | 在线工具
Copyright © 1998 - 2020 PHP1.CN. All Rights Reserved | 京公网安备 11010802041100号 | 京ICP备19059560号-4 | PHP1.CN 第一PHP社区 版权所有