利用MapReduce分析数据

实践内容

 

 

代码:

package shiyan1;


import java.io.IOException;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.NullWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
import org.apache.hadoop.mapreduce.lib.output.TextOutputFormat;
public class test{
    public static class Map extends Mapper<Object,Text , Text , NullWritable>{
    private static Text newKey=new Text();
    public void map(Object key,Text value,Context context) throws IOException, InterruptedException{
    String line=value.toString();
    System.out.println("line"+line);
    String arr[]=line.split("   ");
    newKey.set(arr[1]);
    context.write(newKey, NullWritable.get());
    System.out.println("newKey"+newKey);
    }
    }
    public static class Reduce extends Reducer<Text, NullWritable, Text, NullWritable>{
    public void reduce(Text key,Iterable<NullWritable> values,Context context) throws IOException, InterruptedException{
    context.write(key,NullWritable.get());
    }
    }
    public static void main(String[] args) throws IOException, ClassNotFoundException, InterruptedException{
    Configuration conf=new Configuration();
    System.out.println("start");
    Job job = Job.getInstance(conf);
    job.setJarByClass(test.class);
    job.setMapperClass(Map.class);
    job.setReducerClass(Reduce.class);
    job.setOutputKeyClass(Text.class);
    job.setOutputValueClass(NullWritable.class);
    job.setInputFormatClass(TextInputFormat.class);
    job.setOutputFormatClass(TextOutputFormat.class);
    Path in=new Path("D:\\mapshiyan\\one\\in");
    Path out=new Path("D:\\mapshiyan\\one\\out3");
    FileInputFormat.addInputPath(job,in);
    FileOutputFormat.setOutputPath(job,out);
    System.exit(job.waitForCompletion(true) ? 0 : 1);
    }
}

结果

 

posted @ 2020-11-07 20:36  yizhixiaozhu  阅读(386)  评论(0)  编辑  收藏  举报