package demos; import java.io.IOException; import java.util.Iterator; import java.util.StringTokenizer; import org.apache.hadoop.fs.Path; import org.apache.hadoop.io.BooleanWritable; import org.apache.hadoop.io.IntWritable; import org.apache.hadoop.io.LongWritable; import org.apache.hadoop.io.Text; import org.apache.hadoop.mapred.FileInputFormat; import org.apache.hadoop.mapred.FileOutputFormat; import org.apache.hadoop.mapred.JobClient; import org.apache.hadoop.mapred.JobConf; import org.apache.hadoop.mapred.MapReduceBase; import org.apache.hadoop.mapred.Mapper; import org.apache.hadoop.mapred.OutputCollector; import org.apache.hadoop.mapred.Reducer; import org.apache.hadoop.mapred.Reporter; public class WordFreqMapper extends MapReduceBase implements Mapper{ private static final IntWritable one = new IntWritable(1); private IntWritable freq = new IntWritable(); public void map(LongWritable key, Text value, OutputCollector output, Reporter reporter) throws IOException { String[] parts = value.toString().split("\\t"); freq.set(Integer.parseInt(parts[1])); output.collect(freq, one); } }