import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.api.java.function.FlatMapFunction;
import org.apache.spark.api.java.function.Function;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Iterator;
import java.util.List;
/**
 * Small demo of {@code JavaRDD.mapPartitions}.
 *
 * <p>The program parallelizes the integers 1..6 into two partitions and applies the same
 * per-partition transformation twice: once through an anonymous {@link FlatMapFunction}
 * and once through a method reference. It also repartitions the first result into four
 * partitions and prints every collected result.
 */
public class MapPartitionsDemo {

    /**
     * Runs the demo against a local Spark master.
     *
     * @param args command-line arguments (unused)
     */
    public static void main(String[] args) {
        SparkConf conf = new SparkConf().setMaster("local").setAppName("spark");

        // try-with-resources guarantees the context is closed even when a job throws;
        // previously the context was never stopped.
        try (JavaSparkContext sc = new JavaSparkContext(conf)) {
            List<Integer> list = Arrays.asList(1, 2, 3, 4, 5, 6);
            JavaRDD<Integer> javaRDD = sc.parallelize(list, 2);

            // Variant 1: anonymous inner class. The second argument to mapPartitions is
            // the preservesPartitioning flag.
            JavaRDD<Integer> javaRDD1 = javaRDD.mapPartitions(
                    new FlatMapFunction<Iterator<Integer>, Integer>() {
                        @Override
                        public Iterator<Integer> call(Iterator<Integer> integerIterator) throws Exception {
                            return expandMultiples(integerIterator);
                        }
                    }, true);
            System.err.println(javaRDD1.collect());

            // Redistribute the expanded elements over four partitions and print them.
            JavaRDD<Integer> integerJavaRDD = javaRDD1.repartition(4);
            System.out.println(integerJavaRDD.collect());

            // Variant 2: the same transformation expressed in functional style.
            JavaRDD<Integer> javaRDD2 = javaRDD.mapPartitions(MapPartitionsDemo::expandMultiples, true);
            System.err.println(javaRDD2.collect());
        }
    }

    /**
     * Expands every element of one partition into its multiples.
     *
     * <p>For each value {@code v} read from the iterator, the products {@code v * i} for
     * {@code i = 0..v} (inclusive) are appended in order; e.g. {@code 2} yields
     * {@code 0, 2, 4}.
     *
     * @param values iterator over the elements of a single partition
     * @return iterator over the expanded elements, in encounter order
     */
    private static Iterator<Integer> expandMultiples(Iterator<Integer> values) {
        List<Integer> expanded = new ArrayList<>();
        while (values.hasNext()) {
            int value = values.next();
            for (int i = 0; i <= value; i++) {
                expanded.add(value * i);
            }
        }
        return expanded.iterator();
    }
}