Sharing a sample grep implementation on Hadoop

  • 2020-04-01 03:11:02
A simple grep program written for Hadoop MapReduce that extracts the lines containing a given string from the input documents.

/**
 * Entry class of the grep sample. It extends {@code Configured} and implements
 * {@code Tool}, and contains the mapper used by the job as a static nested class.
 */
public class grep extends Configured  implements Tool{
 /**
  * Mapper that takes {@code LongWritable}/{@code Text} input pairs and emits
  * {@code Text} keys with {@code NullWritable} values.
  */
 public static  class grepMap extends Mapper<LongWritable, Text, Text,NullWritable>{

  /**
   * Handles one input record: reads the "grep" entry from the job configuration
   * and writes the record's value to the output as the key, with a null value.
   *
   * @param line    input key (not used in the visible code)
   * @param value   input value; written to the output unchanged
   * @param context task context, used for configuration lookup and output
   * @throws IOException          declared by the signature
   * @throws InterruptedException declared by the signature
   */
  public void map(LongWritable line,Text value,Context context) throws IOException, InterruptedException{
   //Get the parameters through the Configuration
   String str = context.getConfiguration().get("grep");
   // NOTE(review): str is never used in the visible code, so every record is
   // written regardless of its content. A filter such as a contains-check on
   // value was presumably intended here -- confirm against the original source.
    context.write(value, NullWritable.get());
   // NOTE(review): the closing braces of map() and grepMap are not present at
   // this point in the visible source; lines appear to have been lost.
 /**
  * Prepares the grep job from the command-line arguments.
  *
  * The visible code reads three arguments: args[0] is used as the input path,
  * args[1] as the output path, and args[2] is stored in the configuration
  * under the key "grep".
  *
  * @param args command-line arguments; at least three elements are indexed
  * @return 0 in all cases shown here
  * @throws Exception declared by the signature
  */
 public int run(String[] args) throws Exception {


  Configuration configuration = getConf();
  //Passing parameters
  // Stored under the same "grep" key that the mapper reads from its context.
  configuration.set("grep", args[2]);
  // NOTE(review): the Job(Configuration, String) constructor is reportedly
  // deprecated in newer Hadoop releases in favour of Job.getInstance --
  // confirm against the Hadoop version this project targets.
  Job job = new Job(configuration,"grep");



  Path in = new Path(args[0]);
  Path out = new Path(args[1]);
  // Delete the output path before the job is configured with it; the second
  // argument (true) requests recursive deletion per the Hadoop FileSystem API.
  // Presumably this is so a rerun does not fail on an existing output
  // directory -- confirm.
  FileSystem fileSystem = out.getFileSystem(configuration);
   fileSystem.delete(out, true);

  FileInputFormat.addInputPath(job, in);
  FileOutputFormat.setOutputPath(job, out);

  // NOTE(review): in the visible code the job is never given a mapper class,
  // jar, or output key/value classes, and it is never submitted; the method
  // returns 0 unconditionally. Those lines may have been lost from this
  // snippet -- verify against the original source.
  return 0;

