2019-05-14 23:15:10 +08:00

769 B

// map: build an RDD from a local list, multiply every element by 10, print each result.
// NOTE(review): `sc` is not defined in this snippet; presumably it is the SparkContext
// that spark-shell provides -- confirm before running elsewhere.
val list = List(3, 6, 9, 10, 12, 21)
val listRDD = sc.parallelize(list)
val intsRDD = listRDD.map(_ * 10)
// foreach is an action; elements are printed wherever the tasks run, so the order of
// the printed lines should not be relied on.
intsRDD.foreach(println)

// Same map example written as one chained expression: scale each element of `list`
// by 10 and print it.
sc.parallelize(list).map(n => n * 10).foreach(n => println(n))

// filter: keep only the elements of `list` that are at least 10 and print each one.
sc.parallelize(list).filter(n => n >= 10).foreach(n => println(n))

// flatMap: flatten a list of lists into a single RDD of Ints, multiply each element
// by 10, and print it. The empty inner list contributes no elements.
// Re-binding `list` works in the REPL, where a new `val` shadows the previous one.
val list = List(List(1, 2), List(3), List(), List(4, 5))
sc.parallelize(list).flatMap(_.toList).map(_ * 10).foreach(println)

// reduce: combine all elements with a binary function. The two calls below are the
// same sum, first with an explicit lambda and then with placeholder syntax; for this
// list both evaluate to 15.
// The results are not bound or printed here; in the REPL they are echoed as resN.
val list = List(1, 2, 3, 4, 5)
sc.parallelize(list).reduce((x, y) => x + y)
sc.parallelize(list).reduce(_ + _)

// reduceByKey: sum the values of pairs that share a key and print each (key, sum) pair.
// For this input the pairs are (hadoop,4), (spark,8) and (storm,6); the order in which
// they are printed should not be relied on.
val list = List(("hadoop", 2), ("spark", 3), ("spark", 5), ("storm", 6), ("hadoop", 2))
sc.parallelize(list).reduceByKey(_ + _).foreach(println)

// groupByKey: collect all values that share a key, convert each group to a List so it
// prints readably, and print one (key, values) pair per key.
val list = List(("hadoop", 2), ("spark", 3), ("spark", 5), ("storm", 6), ("hadoop", 2))
sc.parallelize(list).groupByKey().map { case (k, vs) => (k, vs.toList) }.foreach(println)