MapReduce编程模板

mvplee

浏览: 73453 次

最近访客 更多访客>>

simon1991

liangliang01

loren_mt

pistolove

博主相关

博客

微博

相册

留言

关于我

文章分类

社区版块

存档分类

博客分类：

Hadoop

import java.io.IOException;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.conf.Configured;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
import org.apache.hadoop.mapreduce.lib.output.TextOutputFormat;
import org.apache.hadoop.mapreduce.lib.partition.HashPartitioner;
import org.apache.hadoop.util.Tool;
import org.apache.hadoop.util.ToolRunner;

public class ModuleMapReduce extends Configured implements Tool {

	static class ModuleMapper extends
			Mapper<LongWritable, Text, Text, IntWritable> {
		@Override
		protected void setup(
				Mapper<LongWritable, Text, Text, IntWritable>.Context context)
				throws IOException, InterruptedException {
			// TODO Auto-generated method stub
			super.setup(context);
		}

		@Override
		protected void map(LongWritable key, Text value,
				Mapper<LongWritable, Text, Text, IntWritable>.Context context)
				throws IOException, InterruptedException {
			// TODO Auto-generated method stub
			super.map(key, value, context);
		}

		@Override
		protected void cleanup(
				Mapper<LongWritable, Text, Text, IntWritable>.Context context)
				throws IOException, InterruptedException {
			// TODO Auto-generated method stub
			super.cleanup(context);
		}

		@Override
		public void run(
				Mapper<LongWritable, Text, Text, IntWritable>.Context context)
				throws IOException, InterruptedException {
			// TODO Auto-generated method stub
			super.run(context);
		}

	}

	static class ModuleReducer extends
			Reducer<Text, IntWritable, Text, IntWritable> {
		@Override
		protected void setup(
				Reducer<Text, IntWritable, Text, IntWritable>.Context context)
				throws IOException, InterruptedException {
			// TODO Auto-generated method stub
			super.setup(context);
		}

		@Override
		protected void reduce(Text key, Iterable<IntWritable> values,
				Reducer<Text, IntWritable, Text, IntWritable>.Context context)
				throws IOException, InterruptedException {
			// TODO Auto-generated method stub
			super.reduce(key, values, context);
		}

		@Override
		protected void cleanup(
				Reducer<Text, IntWritable, Text, IntWritable>.Context context)
				throws IOException, InterruptedException {
			// TODO Auto-generated method stub
			super.cleanup(context);
		}

		@Override
		public void run(
				Reducer<Text, IntWritable, Text, IntWritable>.Context context)
				throws IOException, InterruptedException {
			// TODO Auto-generated method stub
			super.run(context);
		}

	}

	@Override
	public int run(String[] args) throws Exception {
		if (checkArgs(args) != 0)
			return checkArgs(args);

		Job job = getJob();
		//set input/output path
		FileInputFormat.addInputPath(job, new Path(args[0]));
		FileOutputFormat.setOutputPath(job, new Path(args[1]));
		// set run jar class when package need
		job.setJarByClass(ModuleMapper.class);
		//set map info
		job.setMapperClass(ModuleMapper.class);
		job.setInputFormatClass(TextInputFormat.class);
		job.setMapOutputKeyClass(Text.class);
		job.setMapOutputValueClass(LongWritable.class);
		//set partition
		job.setPartitionerClass(HashPartitioner.class);
		job.setNumReduceTasks(1);
		//set reduce info
		job.setReducerClass(ModuleReducer.class);
		job.setOutputFormatClass(TextOutputFormat.class);
		job.setOutputKeyClass(Text.class);
		job.setOutputValueClass(IntWritable.class);

		return job.waitForCompletion(true) ? 0 : 1;
	}

	private Configuration getConfiguration() {
		Configuration conf = new Configuration();
		return conf;
	}

	private Job getJob() throws IOException {
		Configuration conf = getConfiguration();
		Job job = new Job(conf, ModuleMapReduce.class.getSimpleName());
		return job;
	}

	private int checkArgs(String[] args) {
		if (args.length != 2) {
			System.err.println("args error");
			return 1;
		}
		return 0;
	}

	public static void main(String[] args) throws Exception {
		int exitCode = ToolRunner.run(new ModuleMapReduce(), args);
		System.exit(exitCode);
	}
}

分享到：

MapReduce 两列数据升序排列 | Linux mint17.2 安装输入法

2015-08-05 11:33
浏览 572
评论(0)
分类:企业架构
查看更多

发表评论

您还没有登录,请您登录后再发表评论

最近访客 更多访客>>

博主相关

文章分类

社区版块

存档分类

最新评论

MapReduce编程模板

评论

发表评论

相关推荐

最近访客 更多访客>>

博主相关

文章分类

社区版块

存档分类

最新评论

MapReduce编程模板

评论

发表评论

相关推荐

MapReduce工作原理

Flume数据收集

Hive CLI

HBase集群搭建

HBase简介（很好的梳理资料）

sqoop数据的导入和导出

Combiner

MapReduce统计手机上网流量

hadoop 2.2.0 伪分布安装

Hive And MySQL安装及设置

HBase Shell And JavaAPI使用

伪分布环境安装HBase

分布式环境ZooKeeper3.4.5安装和JavaAPI

VirtualBox+Centos6.4搭建Hadoop1.1.2分布式环境

Hadoop MapReduce入门

编写WordCount程序

YF hadoop笔记

Hadoop hdfs-site.xml文件常用配置

HDFS基本概念

HDFS FileSystem常用方法

最近访客 更多访客>>