Spark Java WordCount:长尾,揭示大数据中的隐秘问题。
- 内容介绍
- 文章标签
- 相关推荐
本文共计194个文字,预计阅读时间需要1分钟。
java
import java.util.Arrays;
import org.apache.spark.api.java.JavaPairRDD;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.sql.SparkSession;
import scala.Tuple2;
public class WordCount3 { public static void main(String[] args) { SparkSession spark=SparkSession.builder().appName(Word Count).getOrCreate(); JavaRDD textFile=spark.sparkContext().textFile(path_to_text_file); JavaRDD words=textFile.flatMap(line -> Arrays.asList(line.split( )).iterator()); JavaPairRDD pairs=words.mapToPair(word -> new Tuple2(word, 1)); JavaPairRDD wordCounts=pairs.reduceByKey((a, b) -> a + b); wordCounts.collect().forEach(System.out::println); }}
WordCount
import java.util.Arrays;
import org.apache.spark.api.java.JavaPairRDD;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.sql.SparkSession;
import scala.Tuple2;
public class WordCount3 {
public static void main(String[] args) {
SparkSession spark = SparkSession.builder().master("local").appName("WordCount3").getOrCreate();
JavaRDD
本文共计194个文字,预计阅读时间需要1分钟。
java
import java.util.Arrays;
import org.apache.spark.api.java.JavaPairRDD;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.sql.SparkSession;
import scala.Tuple2;
public class WordCount3 { public static void main(String[] args) { SparkSession spark=SparkSession.builder().appName(Word Count).getOrCreate(); JavaRDD textFile=spark.sparkContext().textFile(path_to_text_file); JavaRDD words=textFile.flatMap(line -> Arrays.asList(line.split( )).iterator()); JavaPairRDD pairs=words.mapToPair(word -> new Tuple2(word, 1)); JavaPairRDD wordCounts=pairs.reduceByKey((a, b) -> a + b); wordCounts.collect().forEach(System.out::println); }}
WordCount
import java.util.Arrays;
import org.apache.spark.api.java.JavaPairRDD;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.sql.SparkSession;
import scala.Tuple2;
public class WordCount3 {
public static void main(String[] args) {
SparkSession spark = SparkSession.builder().master("local").appName("WordCount3").getOrCreate();
JavaRDD

