MRUnit是一个基于JUnit的单元测试框架,专门用来对Hadoop框架的MapReduce进行单元测试。MRUnit针对于不同的测试对象使用不同的Driver:
- MapDriver,针对单独的Map测试。
- ReduceDriver,针对单独的Reduce进行测试。
- MapReduceDriver,将Map和Reduce连贯起来进行测试。
1、添加依赖
<dependency>
<groupId>org.apache.mrunitgroupId>
<artifactId>mrunitartifactId>
<version>1.1.0version>
<classifier>hadoop2classifier>
dependency>
<!— 添加依赖时注意classifier,区分hadoop1和hadoop2,mapreduceV1配置hadoop1,mapreduceV2配置hadoop2 -->
2、MapReduce程序类
package mapreduce;
import mywritable.PariWritable;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.conf.Configured;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
import org.apache.hadoop.util.Tool;
import org.apache.hadoop.util.ToolRunner;
import java.io.IOException;
public class SortWCMapReduce extends Configured implements Tool {
//Mapper类
public static class SortWCMapper extends
Mapper<LongWritable, Text, PariWritable, IntWritable> {
@Override
protected void map(LongWritable key, Text value, Context context) throws IOException, InterruptedException {
String lineValue = value.toString();
String[] strs = lineValue.split(",");
PariWritable mapOutputKey = new PariWritable(strs[0], Integer.valueOf(strs[1]));
context.write(mapOutputKey, new IntWritable(mapOutputKey.getSecond()));
}
}
//Reducer类
public static class SortWCReducer extends
Reducer<PariWritable, IntWritable, Text, IntWritable> {
@Override
public void reduce(PariWritable key, Iterable values,
Context context) throws IOException, InterruptedException {
for (IntWritable value : values) {
context.write(new Text(key.getFirst()), value);
}
}
}
//Driver驱动方法
public int run(String[] args) throws Exception {
//获取配置
Configuration configuration = this.getConf();
//创建job
Job job = Job.getInstance(configuration, SortWCMapReduce.class.getSimpleName());
//指定MapReduce主类
job.setJarByClass(SortWCMapReduce.class);
//指定输入路径
Path inpath = new Path(args[0]);
FileInputFormat.addInputPath(job, inpath);
//指定输出路径
Path outpath = new Path(args[1]);
FileOutputFormat.setOutputPath(job, outpath);
job.setInputFormatClass(TextInputFormat.class);
job.setMapperClass(SortWCMapper.class);
job.setMapOutputKeyClass(PariWritable.class);
job.setMapOutputValueClass(IntWritable.class);
job.setReducerClass(SortWCReducer.class);
job.setOutputKeyClass(Text.class);
job.setOutputValueClass(IntWritable.class);
boolean isSucces = job.waitForCompletion(true);
return isSucces ? 0 : 1;
}
public static void main(String[] args) throws Exception {
Configuration configuration = new Configuration();
int status = ToolRunner.run(configuration, new SortWCMapReduce(),
args);
System.exit(status);
}
}
3、自定义类型类
package mywritable;
import org.apache.hadoop.io.WritableComparable;
import java.io.DataInput;
import java.io.DataOutput;
import java.io.IOException;
/**
* Created by 鸣宇淳 on 2017/5/15.
*/
public class PariWritable implements WritableComparable<PariWritable> {
private String first;
private Integer second;
public String getFirst() {
return first;
}
public Integer getSecond() {
return second;
}
public PariWritable() {
}
public PariWritable(String f, Integer s) {
this.set(f, s);
}
public void set(String f, Integer s) {
this.first = f;
this.second = s;
}
public void write(DataOutput dataOutput) throws IOException {
dataOutput.writeUTF(first);
dataOutput.writeInt(second);
}
public void readFields(DataInput dataInput) throws IOException {
this.first = dataInput.readUTF();
this.second = dataInput.readInt();
}
@Override
public String toString() {
return first + "|" + second;
}
@Override
public boolean equals(Object obj) {
if (obj == null) {
return false;
}
if (!(obj instanceof PariWritable)) {
return false;
} else {
PariWritable other = (PariWritable) obj;
return this.first.equals(other.first) && this.second.compareTo(other.second) == 0;
}
}
public int compareTo(PariWritable o) {
//先比较第一个,如果第一个相同,比较第二个
int comp = this.first.compareTo(o.first);
if (comp == 0) {
comp= this.second.compareTo(o.second);
}
return comp;
}
}
4、单元测试类
import mapreduce.SortWCMapReduce;
import mywritable.PariWritable;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mrunit.mapreduce.MapDriver;
import org.apache.hadoop.mrunit.mapreduce.ReduceDriver;
import org.junit.Before;
import org.junit.Test;
import java.io.IOException;
import java.util.ArrayList;
/**
* Created by 鸣宇淳 on 2017/5/12.
*/
public class SortWCMapReduceTest {
MapDriver mapDriver;
ReduceDriver reduceDriver;
@Before
public void setUp() {
SortWCMapReduce.SortWCMapper mapper = new SortWCMapReduce.SortWCMapper();
SortWCMapReduce.SortWCReducer reduce = new SortWCMapReduce.SortWCReducer();
mapDriver = new MapDriver(mapper);
reduceDriver = new ReduceDriver(reduce);
}
//Map测试方法
@Test
public void testMapper() throws IOException {
mapDriver.withInput(new LongWritable(), new Text("655209,3"));
mapDriver.withOutput(new PariWritable("655209", 3), new IntWritable(3));
mapDriver.runTest();
}
//reduce测试方法
@Test
public void testReduce() throws IOException {
reduceDriver.withInput(new PariWritable("62669", 5), new ArrayList() {
{
add(new IntWritable(1));
add(new IntWritable(3));
}
});
reduceDriver.withOutput(new Text("62669"), new IntWritable(1))
.withOutput(new Text("62669"), new IntWritable(3));
reduceDriver.runTest();
}
//MapReduce整体测试方法
@Test
public void testMapReduce() {
mapReduceDriver.withInput(new LongWritable(), new Text("10001,4"))
.withInput(new LongWritable(), new Text("10002,2"))
.withInput(new LongWritable(), new Text("10001,2"))
mapReduceDriver.withOutput(new Text("10001"), new IntWritable(2))
.withOutput(new Text("10001"), new IntWritable(4))
.withOutput(new Text("10002"), new IntWritable(2));
}
}