代码拉取完成,页面将自动刷新
import model.Info;
import org.apache.spark.api.java.JavaPairRDD;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.function.Function;
import org.apache.spark.sql.Dataset;
import org.apache.spark.sql.Row;
import org.apache.spark.sql.SaveMode;
import org.apache.spark.sql.SparkSession;
import scala.Tuple2;
import java.util.Arrays;
/**
 * Word-count example that goes from an RDD of text lines to a DataFrame and
 * aggregates it with Spark SQL.
 *
 * <p>Pipeline: read text lines, split each line on single spaces, wrap every
 * non-empty token in an {@link Info} bean with a count of 1, expose the beans
 * as the temporary view {@code info}, group by word in SQL, print the result
 * and write it out as CSV.
 */
public class WordCountSql {

    /** Input location handed to {@code spark.read().textFile(...)}. */
    private static final String INPUT_PATH = "src/main/resources/data";

    /** Output location for the CSV result; written with {@link SaveMode#Overwrite}. */
    private static final String OUTPUT_PATH = "src/main/resources/result";

    /**
     * Runs the word count on a local Spark session using all available cores.
     *
     * @param args command-line arguments; not used
     */
    public static void main(String[] args) {
        SparkSession spark = SparkSession.builder()
                .appName("RDDToDataset")
                .master("local[*]")
                .getOrCreate();
        try {
            JavaRDD<String> lines = spark.read().textFile(INPUT_PATH).javaRDD();

            // split(" ") produces empty tokens for blank lines, leading spaces and
            // runs of spaces; drop them so they are not counted as a word.
            JavaRDD<String> words = lines
                    .flatMap(line -> Arrays.asList(line.split(" ")).iterator())
                    .filter(word -> !word.isEmpty());

            // One Info bean per word occurrence, each carrying a count of 1.
            // The mapping is kept free of side effects (no per-record printing).
            JavaRDD<Info> infoRdd = words.map(word -> {
                Info info = new Info();
                info.setWord(word);
                info.setCnt(1);
                return info;
            });

            // The DataFrame schema is derived from the Info bean class.
            Dataset<Row> infoDf = spark.createDataFrame(infoRdd, Info.class);
            infoDf.printSchema();
            infoDf.createOrReplaceTempView("info");

            // count(cnt) counts the rows per word; every row carries cnt = 1,
            // so this is the number of occurrences of each word.
            Dataset<Row> countsDf = spark.sql("select word,count(cnt) as cnt from info group by word");
            countsDf.show();

            // coalesce(2) caps the result at two partitions before writing.
            // csv(path) already selects the CSV format, so no separate format() call is needed.
            countsDf.coalesce(2).write().mode(SaveMode.Overwrite).csv(OUTPUT_PATH);
        } finally {
            // Always release the session, even when a step above throws.
            spark.stop();
        }
    }
}
此处可能存在不合适展示的内容,页面不予展示。您可通过相关编辑功能自查并修改。
如您确认内容无涉及 不当用语 / 纯广告导流 / 暴力 / 低俗色情 / 侵权 / 盗版 / 虚假 / 无价值内容或违法国家有关法律法规的内容,可点击提交进行申诉,我们将尽快为您处理。