zoukankan      html  css  js  c++  java
  • 数据筛选

    数据准备

    route_log

    Apr 23 11:49:54 hostapd: wlan0: STA 14:7d:c5:9e:fb:84

    Apr 23 11:49:52 hostapd: wlan0: STA 74:e5:0b:04:28:f2

    Apr 23 11:49:50 hostapd: wlan0: STA cc:af:78:cc:d5:5d

    Apr 23 11:49:44 hostapd: wlan0: STA cc:af:78:cc:d5:5d

    Apr 23 11:49:43 hostapd: wlan0: STA 14:7d:c5:9e:fb:84

    Apr 23 11:49:42 hostapd: wlan0: STA 74:e5:0b:04:28:f2

    将 route_log 上传到 HDFS 上(代码中读取的路径为 /value/route_log),然后从每行日志中筛选出三个字段:month、day、mac。

    代码编写

    import org.apache.hadoop.conf.Configuration;
    import org.apache.hadoop.conf.Configured;
    import org.apache.hadoop.fs.Path;
    import org.apache.hadoop.io.LongWritable;
    import org.apache.hadoop.io.NullWritable;
    import org.apache.hadoop.io.Text;
    import org.apache.hadoop.mapreduce.Job;
    import org.apache.hadoop.mapreduce.Mapper;
    import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
    import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
    import org.apache.hadoop.util.Tool;
    import org.apache.hadoop.util.ToolRunner;
    
    /**
     * Driver for the "route_filter" MapReduce job.
     *
     * <p>The job reads hostapd log lines, runs {@link RouteMap} over them and
     * writes one {@code "month day mac"} record per valid input line. No reducer
     * class is configured here, so whatever reducer Hadoop uses by default
     * applies.
     *
     * <p>Usage: {@code Route_filter [genericOptions] [inputPath [outputPath]]}.
     * When the paths are omitted the original hard-coded locations are used.
     */
    public class Route_filter extends Configured implements Tool {

        /** HDFS input path used when no input argument is supplied. */
        private static final String DEFAULT_INPUT = "/value/route_log";

        /** HDFS output directory used when no output argument is supplied. */
        private static final String DEFAULT_OUTPUT = "/outvalue/outroute_log";

        /**
         * Configures the job, runs it and blocks until it has finished.
         *
         * @param args optional positional arguments left after generic-option
         *             parsing: {@code args[0]} is the input path and
         *             {@code args[1]} the output path; may be {@code null} or empty
         * @return {@code 0} if the job completed successfully, {@code 1} otherwise
         * @throws Exception if the job cannot be configured, submitted or monitored
         */
        @Override
        public int run(String[] args) throws Exception {
            String input = (args != null && args.length > 0) ? args[0] : DEFAULT_INPUT;
            String output = (args != null && args.length > 1) ? args[1] : DEFAULT_OUTPUT;

            Configuration conf = getConf();
            Job job = new Job(conf, "route_filter");
            job.setJarByClass(Route_filter.class);
            job.setOutputKeyClass(Text.class);
            job.setOutputValueClass(NullWritable.class);
            job.setMapperClass(RouteMap.class);
            FileInputFormat.addInputPath(job, new Path(input));
            FileOutputFormat.setOutputPath(job, new Path(output));

            // submit() returns immediately, so querying isSuccessful() right after
            // it inspects a job that has not finished. waitForCompletion() blocks
            // until the job is done and reports the real outcome.
            return job.waitForCompletion(true) ? 0 : 1;
        }

        /**
         * Command-line entry point.
         *
         * <p>Forwards the command-line arguments to {@link ToolRunner} so that
         * generic Hadoop options are honoured, and propagates the job result as
         * the process exit status.
         *
         * @param args command-line arguments
         * @throws Exception if the tool fails to run
         */
        public static void main(String[] args) throws Exception {
            System.exit(ToolRunner.run(new Configuration(), new Route_filter(), args));
        }
    }
    
    class RouteMap extends Mapper<LongWritable, Text, Text, NullWritable> {
    private Text result = new Text();
    
    protected void map(LongWritable key, Text value, Context context)
    throws java.io.IOException, InterruptedException {
    String lineValue = value.toString();
    String[] lineSplit = lineValue.split(" ");
    String month = lineSplit[0];
    String day = lineSplit[1];
    String mac = lineSplit[6];
    result.set(month + " " + day + " " + mac);
    context.write(result, NullWritable.get());
    }
    }
    

      

    最终输出结果:

    Apr 23 14:7d:c5:9e:fb:84
    Apr 23 14:7d:c5:9e:fb:84
    Apr 23 74:e5:0b:04:28:f2
    Apr 23 74:e5:0b:04:28:f2
    Apr 23 cc:af:78:cc:d5:5d
    Apr 23 cc:af:78:cc:d5:5d

  • 相关阅读:
    jQuery的选择器中的通配符[id^='code']
    浏览器调试js
    google浏览器调试js
    【暑假】[实用数据结构]UVAlive 3026 Period
    【暑假】[实用数据结构]UVAlive 3942 Remember the Word
    【暑假】[实用数据结构] AC自动机
    【暑假】[实用数据结构]KMP
    【暑假】[实用数据结构]前缀树 Trie
    【暑假】[实用数据结构]UVa11235 Frequent values
    【暑假】[实用数据结构]UVAlive 4329 Ping pong
  • 原文地址:https://www.cnblogs.com/LgyBean/p/5037081.html
Copyright © 2011-2022 走看看