object WordCount {
def main(args: Array[String]): Unit = {
val sparkConf =new SparkConf().setMaster("local").setAppName("WordCount")
val sc= new SparkContext(sparkConf)
val datas: RDD[(String,Int)] = sc.makeRDD(
List(("Spark",5),("Hadoop",3),("Scala",4),("Spark",3),("Hadoop",1)),5)
val a = datas.groupByKey() //按key分组 (张三,CompactBuffer(78, 80, 88))
.map(x => {
var num = 0
var sum = 0
for (i <- x._2) {
sum = sum + i
num = num + 1
}
val avg = sum / num
(x._1, avg)
})
a.collect.foreach(x => println(x._1+"\t"+x._2))
//关闭毗连
sc.stop()
}}