返回第一个元素
scala
scala> val rdd = sc.parallelize(List(1,2,3,3))
scala> rdd.first()
res1: Int = 1
java
JavaRDD...
scala> val rdd = sc.parallelize(List(1,2,3,3))
scala> rdd.take(2)
res3: Array[Int] = Array(1, 2)
java
JavaRDD...
scala> val rdd = sc.parallelize(List(1,2,3,3))
scala> rdd.collect()
res4: Array[Int] = Array(1, 2, 3, 3)
java
JavaRDD...
scala> rdd.countByValue()
res6: scala.collection.Map[Int,Long] = Map(1 -> 1, 2 -> 1, 3 -> 2)
java
JavaRDD...
scala> val rdd = sc.parallelize(List(1,2,3,3),2)
scala> rdd.fold(1)((x,y)=>x+y)
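res8: Int = 12
// 注意：结果是 12 而不是 10。fold 的初始值 1 会在每个分区内各参与一次计算（共 2 个分区），
// 在合并各分区结果时还会再参与一次，因此结果为 9 + 1 × (2 + 1) = 12。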
java
JavaRDD