Skip to content

WordCount version one

Dennis Dawson edited this page Aug 28, 2015 · 11 revisions
package org.myorg;

import java.io.IOException;
import java.util.regex.Pattern;
import org.apache.hadoop.conf.Configured;
import org.apache.hadoop.util.Tool;import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.util.ToolRunner;
import org.apache.log4j.Logger;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
public class WordCount extends Configured implements Tool {

  private static final Logger LOG = Logger .getLogger( WordCount .class);
  public static void main( String[] args) throws  Exception {
    int res  = ToolRunner .run( new WordCount(), args);
    System .exit(res);
  }
  public int run( String[] args) throws  Exception {
  Job job  = Job .getInstance(getConf(), " wordcount ");
  job.setJarByClass( this .getClass());
  FileInputFormat.addInputPaths(job,  new Path(args[ 0]));
  FileOutputFormat.setOutputPath(job,  new Path(args[ 1]));
  job.setMapperClass( Map .class);
  job.setReducerClass( Reduce .class);
  job.setOutputKeyClass( Text .class);
  job.setOutputValueClass( IntWritable .class);
  return job.waitForCompletion( true)  ? 0 : 1;
  }
}

Clone this wiki locally