数据样例:
java,spark,hadoop,python,datax
java,spark,hadoop,spark,python,datax
java,spark,hadoop,python,datax
java,spark,hadoop,spark,python
java,spark,hadoop,spark,python,datax
java,spark,hadoop,python,datax
java,spark,hadoop,python,datax
java,spark,hadoop,spark,python,datax
java,spark,hadoop,python,datax
java,spark,hadoop,spark,python,datax
hadoop,spark,spark,python
package com.shujia

import scala.io.Source

/**
 * Word-count example: reads a text file whose lines are comma-separated
 * words and prints how many times each distinct word occurs.
 */
object Test1wordcount {

  /** File that is read when no path is supplied on the command line. */
  private val DefaultInputPath: String = "data/words.txt"

  /**
   * Program entry point. Prints one `(word,count)` tuple per distinct word
   * to standard output; the order of the printed tuples is unspecified
   * because the counts are held in an unordered `Map`.
   *
   * @param args optional; when present, `args(0)` is the path of the file to
   *             read. Without arguments the program reads `data/words.txt`.
   */
  def main(args: Array[String]): Unit = {
    val inputPath: String = args.headOption.getOrElse(DefaultInputPath)

    val source = Source.fromFile(inputPath)
    // `getLines()` is lazy, so the lines must be fully materialised before
    // the underlying file handle is released in `finally`.
    val lines: List[String] =
      try source.getLines().toList
      finally source.close()

    countWords(lines).foreach(println)
  }

  /**
   * Counts the occurrences of every word in the given lines.
   *
   * Each line is split on `,`; tokens are trimmed and empty tokens (caused by
   * blank lines or stray commas) are ignored so they are not reported as a
   * word.
   *
   * @param lines the raw lines of the input file
   * @return a map from each distinct word to its number of occurrences
   */
  private def countWords(lines: List[String]): Map[String, Int] =
    lines
      .flatMap(_.split(","))
      .map(_.trim)
      .filter(_.nonEmpty)
      .groupBy(identity)
      .map { case (word, occurrences) => word -> occurrences.length }
}
输出结果(各单词的计数恰好是上面样例统计值的 4 倍,推测实际的 data/words.txt 中样例内容重复了 4 次):
F:\soft\java\jdk\bin\java.exe "-javaagent:F:\soft\IDEA\IntelliJ ...
(datax,36)
(java,40)
(hadoop,44)
(spark,68)
(python,44)

Process finished with exit code 0
【推荐】编程新体验,更懂你的AI,立即体验豆包MarsCode编程助手
【推荐】凌霞软件回馈社区,博客园 & 1Panel & Halo 联合会员上线
【推荐】抖音旗下AI助手豆包,你的智能百科全书,全免费不限次数
【推荐】博客园社区专享云产品让利特惠,阿里云新客6.5折上折
【推荐】轻量又高性能的 SSH 工具 IShell:AI 加持,快人一步
· 一个费力不讨好的项目,让我损失了近一半的绩效!
· 清华大学推出第四讲使用 DeepSeek + DeepResearch 让科研像聊天一样简单!
· 实操Deepseek接入个人知识库
· CSnakes vs Python.NET:高效嵌入与灵活互通的跨语言方案对比
· Plotly.NET 一个为 .NET 打造的强大开源交互式图表库