在 Hadoop 上运行 MapReduce 程序的两种方法

之前学习了一段时间 Hadoop 的相关知识。学习理论基础的同时要动手实际操作，才能对它更加熟练。废话不多说，下面就来说说如何在 Hadoop 上运行一个最简单的 words count 程序。

首先贴上这个程序的源代码供大家参考。代码分为三个部分：Run（作业驱动类）、map 阶段、reduce 阶段。

Map：


  
  
   
   
    
    
     
     
    
    
    
    
     
     
      
      package wordsCount;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
      
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import java.io.IOException;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import java.util.StringTokenizer;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
      
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.io.IntWritable;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.io.LongWritable;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.io.Text;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.mapreduce.Mapper;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
      
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      /**
       * Map stage of the word-count job.
       *
       * <p>Each input record is one line of text. The line is split into tokens with
       * {@link StringTokenizer}'s default delimiters, and a {@code (token, 1)} pair is
       * written to the context for every token.
       */
      public class WordsMapper extends Mapper<LongWritable, Text, Text, IntWritable> {

        /** Count written with every token; its value is never changed after construction. */
        private static final IntWritable ONE = new IntWritable(1);

        /**
         * Output key reused across tokens instead of allocating a new {@code Text} per
         * token. This mirrors the Hadoop WordCount example and assumes the output
         * collector does not retain a reference to the key after {@code write} returns.
         */
        private final Text word = new Text();

        /**
         * Emits one {@code (token, 1)} pair per token found in {@code value}.
         *
         * @param key input key supplied by the input format; not used here
         * @param value one line of input text
         * @param context sink for the emitted pairs
         * @throws IOException if writing to the context fails
         * @throws InterruptedException if the task is interrupted while writing
         */
        @Override
        protected void map(LongWritable key, Text value, Context context)
            throws IOException, InterruptedException {
          StringTokenizer tokens = new StringTokenizer(value.toString());
          while (tokens.hasMoreTokens()) {
            word.set(tokens.nextToken());
            context.write(word, ONE);
          }
        }
      }

Reduce：


  
  
   
   
    
    
     
     
    
    
    
    
     
     
      
      package wordsCount;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
      
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import java.io.IOException;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
      
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.io.IntWritable;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.io.Text;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.mapreduce.Reducer;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
      
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      /**
       * Reduce stage of the word-count job.
       *
       * <p>For each key, adds up all the {@code IntWritable} values grouped under it and
       * writes a single {@code (key, sum)} pair.
       */
      public class WordsReduce extends Reducer<Text, IntWritable, Text, IntWritable> {

        /**
         * Output value reused across keys instead of allocating a new {@code IntWritable}
         * per key. This assumes the output collector does not retain a reference to the
         * value after {@code write} returns, as in the Hadoop WordCount example.
         */
        private final IntWritable total = new IntWritable();

        /**
         * Sums the counts for one key and emits the total.
         *
         * @param key the word being counted
         * @param iterator the counts grouped under {@code key} (an {@code Iterable}, despite
         *     the parameter name)
         * @param context sink for the emitted pair
         * @throws IOException if writing to the context fails
         * @throws InterruptedException if the task is interrupted while writing
         */
        @Override
        protected void reduce(Text key, Iterable<IntWritable> iterator, Context context)
            throws IOException, InterruptedException {
          // The sum is accumulated in an int because the declared output value type is
          // IntWritable; totals beyond Integer.MAX_VALUE would wrap around.
          int sum = 0;
          for (IntWritable count : iterator) {
            sum += count.get();
          }
          total.set(sum);
          context.write(key, total);
        }
      }

Run：


  
  
   
   
    
    
     
     
    
    
    
    
     
     
      
      package wordsCount;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
      
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
      
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.conf.Configuration;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.fs.Path;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.io.IntWritable;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.io.Text;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.mapreduce.Job;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      import org.apache.hadoop.mapreduce.lib.output.TextOutputFormat;
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
      
     
     
    
    
   
   
    
    
     
     
    
    
    
    
     
     
      
      /**
       * Driver that configures and submits the word-count job.
       *
       * <p>Wires {@link WordsMapper} and {@link WordsReduce} into a job that reads text
       * input and writes text output with {@code Text} keys and {@code IntWritable} values.
       */
      public class Run {

        /** Input directory used when no paths are given on the command line. */
        private static final String DEFAULT_INPUT_PATH = "hdfs://192.168.1.111:9000/user/input/wc/";

        /** Output directory used when no paths are given on the command line. */
        private static final String DEFAULT_OUTPUT_PATH = "hdfs://192.168.1.111:9000/user/result/";

        /**
         * Submits the job, waits for it to finish, and exits with status 0 on success or 1
         * on failure so that calling scripts can detect a failed job.
         *
         * @param args optional; when exactly two arguments are given they are used as the
         *     input path and output path, otherwise the built-in default paths are used
         * @throws Exception if the job cannot be configured, submitted, or monitored
         */
        public static void main(String[] args) throws Exception {
          boolean pathsGiven = args != null && args.length == 2;
          String inputPath = pathsGiven ? args[0] : DEFAULT_INPUT_PATH;
          String outputPath = pathsGiven ? args[1] : DEFAULT_OUTPUT_PATH;

          Configuration configuration = new Configuration();
          // Factory method replaces the deprecated Job(Configuration) constructor.
          Job job = Job.getInstance(configuration);
          job.setJarByClass(Run.class);
          job.setJobName("words count!");

          job.setOutputKeyClass(Text.class);
          job.setOutputValueClass(IntWritable.class);

          job.setInputFormatClass(TextInputFormat.class);
          job.setOutputFormatClass(TextOutputFormat.class);

          job.setMapperClass(WordsMapper.class);
          job.setReducerClass(WordsReduce.class);

          FileInputFormat.addInputPath(job, new Path(inputPath));
          FileOutputFormat.setOutputPath(job, new Path(outputPath));

          // Propagate the job outcome instead of discarding it.
          boolean succeeded = job.waitForCompletion(true);
          System.exit(succeeded ? 0 : 1);
        }
      }