// CombinerTest
package a.b.c;
import java.io.IOException;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
// Counts the number of visits made by each IP address in the NASA access log.
/**
 * Mapper that emits {@code (visitorIP, 1)} for every non-blank input line.
 *
 * <p>The visitor IP is taken to be the first space-delimited token of the line.
 * Leading and trailing whitespace is trimmed first, so blank or whitespace-only
 * lines are skipped instead of producing an empty key or an
 * {@link ArrayIndexOutOfBoundsException}.
 */
class SumMapper extends Mapper<LongWritable, Text, Text, IntWritable> {

    /** Count emitted for every visit; shared so no object is allocated per record. */
    private static final IntWritable ONE = new IntWritable(1);

    /** Output key instance, overwritten for each record before it is written. */
    private final Text visitorIp = new Text();

    /**
     * Extracts the first token of the line and writes it with a count of one.
     *
     * @param key     input key supplied by the framework (not used here)
     * @param value   one line of the input
     * @param context sink for the {@code (visitorIP, 1)} pair
     * @throws IOException          if writing to the context fails
     * @throws InterruptedException if the task is interrupted while writing
     */
    @Override
    protected void map(LongWritable key, Text value, Context context)
            throws IOException, InterruptedException {
        String line = value.toString().trim();
        if (line.isEmpty()) {
            // Nothing to count on a blank line.
            return;
        }
        // Only the first token is needed, so locate the first space instead of
        // splitting the entire line into an array.
        int firstSpace = line.indexOf(' ');
        visitorIp.set(firstSpace < 0 ? line : line.substring(0, firstSpace));
        context.write(visitorIp, ONE);
    }
}
/**
 * Combiner that adds up the counts received for a key and writes a single
 * {@code (key, sum)} pair.
 */
class SumCombiner extends Reducer<Text, IntWritable, Text, IntWritable> {

    /**
     * Sums all values for {@code key} and writes the total.
     *
     * @param key     the key being aggregated
     * @param val     counts received for this key
     * @param context sink for the {@code (key, sum)} pair
     * @throws IOException          if writing to the context fails
     * @throws InterruptedException if the task is interrupted while writing
     */
    @Override
    protected void reduce(Text key, Iterable<IntWritable> val, Context context)
            throws IOException, InterruptedException {
        int partialCount = 0;
        for (IntWritable count : val) {
            partialCount = partialCount + count.get();
        }
        IntWritable result = new IntWritable(partialCount);
        context.write(key, result);
    }
}
/**
 * Reducer that adds up the counts received for a key and writes the
 * {@code (key, total)} pair.
 */
class SumReducer extends Reducer<Text, IntWritable, Text, IntWritable> {

    /**
     * Sums all values for {@code key} and writes the total.
     *
     * @param key     the key being aggregated
     * @param val     counts received for this key
     * @param context sink for the {@code (key, total)} pair
     * @throws IOException          if writing to the context fails
     * @throws InterruptedException if the task is interrupted while writing
     */
    @Override
    protected void reduce(Text key, Iterable<IntWritable> val, Context context)
            throws IOException, InterruptedException {
        int total = 0;
        java.util.Iterator<IntWritable> counts = val.iterator();
        while (counts.hasNext()) {
            total += counts.next().get();
        }
        context.write(key, new IntWritable(total));
    }
}
/**
 * Driver that configures and submits the job: {@link SumMapper} as mapper,
 * {@link SumCombiner} as combiner and {@link SumReducer} as reducer, with
 * {@code Text} keys and {@code IntWritable} values.
 */
public class CombinerTest {

    /**
     * Configures the job, runs it, and exits the JVM with the job's status.
     *
     * @param args {@code args[0]} is the input path, {@code args[1]} is the output path;
     *             any further arguments are ignored
     * @throws IOException            if the job cannot be created or submitted
     * @throws ClassNotFoundException if a job class cannot be resolved
     * @throws InterruptedException   if interrupted while waiting for completion
     */
    public static void main(String[] args) throws IOException, ClassNotFoundException, InterruptedException {
        // Fail with a readable message instead of an ArrayIndexOutOfBoundsException
        // when the paths are missing.
        if (args.length < 2) {
            System.err.println("Usage: CombinerTest <input path> <output path>");
            System.exit(2);
        }

        Configuration configuration = new Configuration();
        Job job = Job.getInstance(configuration);

        // Class used to locate the jar containing the job classes.
        job.setJarByClass(CombinerTest.class);

        // Mapper and its output types.
        job.setMapperClass(SumMapper.class);
        job.setMapOutputKeyClass(Text.class);
        job.setMapOutputValueClass(IntWritable.class);

        // Combiner.
        job.setCombinerClass(SumCombiner.class);

        // Reducer and the final output types.
        job.setReducerClass(SumReducer.class);
        job.setOutputKeyClass(Text.class);
        job.setOutputValueClass(IntWritable.class);

        // Input and output locations.
        FileInputFormat.addInputPath(job, new Path(args[0]));
        FileOutputFormat.setOutputPath(job, new Path(args[1]));

        // Exit code 0 on success, 1 on failure.
        System.exit(job.waitForCompletion(true) ? 0 : 1);
    }
}
// MapReduceAPI
// Latest recommended article published on 2022-03-17 12:35:21