KeyValueTextInputFormat实例
来源:互联网 发布:mac jenkins 启动 编辑:程序博客网 时间:2024/06/02 05:31
package inputformat;

import java.io.IOException;
import java.net.URI;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.input.KeyValueLineRecordReader;
import org.apache.hadoop.mapreduce.lib.input.KeyValueTextInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;

/**
 * Map-only example job that reads its input through {@link KeyValueTextInputFormat}.
 *
 * <p>Each input record reaches the mapper as a (key, value) pair of {@link Text}; the mapper
 * writes the key and the value each paired with the count 1. The job runs with zero reduce
 * tasks.
 *
 * <p>Sample input as given in the original comment (the separator characters between the
 * fields appear to have been lost when the page was extracted):
 * <pre>
 * helloyouhelloyou
 * hellome
 * </pre>
 */
public class MyKeyValueTextInputFormatApp {
    private static final String INPUT_PATH = "hdfs://chaoren1:9000/hello";
    private static final String OUT_PATH = "hdfs://chaoren1:9000/out";

    /**
     * Configures and runs the job, blocking until it finishes.
     *
     * <p>The output directory {@code OUT_PATH} is deleted recursively before the job is
     * submitted. If the job reports failure the JVM exits with status 1.
     *
     * @param args command-line arguments; not used
     * @throws Exception if the file system cannot be reached or the job cannot be run
     */
    public static void main(String[] args) throws Exception {
        Configuration conf = new Configuration();
        // Split each input line into key and value on this separator.
        conf.set(KeyValueLineRecordReader.KEY_VALUE_SEPERATOR, "\t");

        // Remove output left over from a previous run.
        final FileSystem filesystem = FileSystem.get(new URI(OUT_PATH), conf);
        filesystem.delete(new Path(OUT_PATH), true);

        final Job job = new Job(conf, MyKeyValueTextInputFormatApp.class.getSimpleName());
        job.setJarByClass(MyKeyValueTextInputFormatApp.class);

        FileInputFormat.setInputPaths(job, INPUT_PATH);
        job.setInputFormatClass(KeyValueTextInputFormat.class);

        job.setMapperClass(MyMapper.class);
        job.setMapOutputKeyClass(Text.class);
        job.setMapOutputValueClass(LongWritable.class);

        // Map-only job: no reduce tasks are scheduled.
        job.setNumReduceTasks(0);

        job.setOutputKeyClass(Text.class);
        job.setOutputValueClass(LongWritable.class);
        FileOutputFormat.setOutputPath(job, new Path(OUT_PATH));

        // Surface a failed job through the process exit status instead of ignoring it.
        if (!job.waitForCompletion(true)) {
            System.exit(1);
        }
    }

    /**
     * Mapper that emits both the key and the value of every input record with the count 1.
     */
    public static class MyMapper extends Mapper<Text, Text, Text, LongWritable> {
        /** Constant count written with every record; reused as in the Hadoop WordCount example. */
        private final LongWritable one = new LongWritable(1);

        /**
         * Writes {@code (key, 1)} followed by {@code (value, 1)}.
         *
         * @param key     key part of the input record
         * @param value   value part of the input record
         * @param context job context used to write the output pairs
         * @throws IOException          if writing an output pair fails
         * @throws InterruptedException if the task is interrupted while writing
         */
        @Override
        protected void map(Text key, Text value, Context context)
                throws IOException, InterruptedException {
            context.write(key, one);
            context.write(value, one);
        }
    }
}
0 0
- KeyValueTextInputFormat实例
- hadoop 之 InputFormat类 --- KeyValueTextInputFormat 实例
- KeyValueTextInputFormat 重写
- KeyValueTextInputFormat用法
- MapReduce的KeyValueTextInputFormat
- KeyValueTextInputFormat 分割key value For hadoop 1.0
- KeyValueTextInputFormat 分割key value For hadoop 1.0
- Hadoop Problem : hadoop0.20.2中的KeyValueTextInputFormat
- MapReduce的输入格式---KeyValueTextInputFormat---源码分析
- KeyValueTextInputFormat 分割key value 设置问题:key.value.separator.in.input.line
- 实例
- 实例
- 实例
- 实例
- 实例
- 实例
- 实例
- 实例
- GenericWritable实例
- 创业总结:创业公司怎样留人
- 用摄像头进行人脸和人眼实时检测的优化 算法
- hdu_1013_Digital Roots(模拟)
- linux内核编译
- KeyValueTextInputFormat实例
- java Heap Dump基本概念及如何获取
- Toad趣题:说真话的程序员 & 不说实话的经理
- HPU1287: HH实习 【贪心】
- java自学系列之0
- NLineInputFormat实例
- c++地址复制strcpy
- android中使用Application
- 开源代码学习之——NoBoringActionBar