Eclipse 环境下，将 MapReduce 作业提交到集群运行

最新推荐文章于 2021-12-01 09:02:42 发布

apache-bbccb

最新推荐文章于 2021-12-01 09:02:42 发布

阅读量572

点赞数

分类专栏： hadoop

本文链接：https://blog.csdn.net/xgskj/article/details/40543413

版权

hadoop 专栏收录该内容

28 篇文章 0 订阅

订阅专栏

package com.test;

import java.io.File;
import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.io.IOException;
import java.util.jar.JarEntry;
import java.util.jar.JarOutputStream;
import java.util.jar.Manifest;

public class JarTool {

	public static File createTempJar(String root) throws IOException {
		if (!new File(root).exists()) {
			return null;
		}
		// 创建manifest文件
		Manifest manifest = new Manifest();
		// 设置主属性
		manifest.getMainAttributes().putValue("Manifest-Version", "1.0");
		// 创建临时文件
		final File jarFile = File.createTempFile("EJar-", ".jar", new File(System.getProperty("java.io.tmpdir")));
		Runtime.getRuntime().addShutdownHook(new Thread() {
			public void run() {
				jarFile.delete();
			}
		});
		// 创建Jar文件输出流
		JarOutputStream out = new JarOutputStream(new FileOutputStream(jarFile), manifest);
		createTempJarInner(out, new File(root), "");
		out.flush();
		out.close();
		return jarFile;

	}

	// 遍历目录下文件
	private static void createTempJarInner(JarOutputStream out, File f,
			String base) throws IOException {
		if (f.isDirectory()) {
			File[] fl = f.listFiles();
			if (base.length() > 0) {
				base = base + "/";
			}
			for (int i = 0; i < fl.length; i++) {
				createTempJarInner(out, fl[i], base + fl[i].getName());
			}
		} else {
			out.putNextEntry(new JarEntry(base));
			FileInputStream in = new FileInputStream(f);
			byte[] buffer = new byte[1024];
			int n = in.read(buffer);
			while (n != -1) {
				out.write(buffer, 0, n);
				n = in.read(buffer);
			}
			in.close();
		}
	}

	/*public static void addClasspath(String component) {
		if ((component != null) && (component.length() > 0)) {
			try {
				File f = new File(component);

				if (f.exists()) {
					URL key = f.getCanonicalFile().toURL();
					if (!classPath.contains(key)) {

						classPath.add(key);
					}
				}

			} catch (IOException e) {
			}
		}
	}*/

}


package com.test;

import java.io.File;
import java.io.IOException;
import java.net.URI;
import java.util.StringTokenizer;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapred.JobConf;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;

/**
 * Word-count MapReduce job that is launched from the IDE and submitted to a
 * remote cluster.
 *
 * <p>Before submission, the compiled classes directory is packaged into a
 * temporary JAR with {@link JarTool} and that JAR is set as the job JAR.
 */
public class WordCount {

	/** Input text file on HDFS. */
	private static final String INPUT_PATH = "hdfs://linux:9000/input.txt";

	/** Output directory on HDFS; it is deleted before the job runs. */
	private static final String OUT_PATH = "hdfs://linux:9000/output";

	/** Directory (relative to the working directory) holding the compiled classes. */
	private static final String CLASSES_DIR = "bin";

	/** Emits {@code (token, 1)} for every whitespace-separated token of a line. */
	public static class TokenizerMapper extends
			Mapper<Object, Text, Text, IntWritable> {

		private final static IntWritable one = new IntWritable(1);
		// Reused across calls to avoid allocating a Text per token.
		private Text word = new Text();

		public void map(Object key, Text value, Context context)
				throws IOException, InterruptedException {
			StringTokenizer itr = new StringTokenizer(value.toString());
			while (itr.hasMoreTokens()) {
				word.set(itr.nextToken());
				context.write(word, one);
			}
		}
	}

	/** Sums the counts received for each word and emits {@code (word, total)}. */
	public static class IntSumReducer extends
			Reducer<Text, IntWritable, Text, IntWritable> {
		// Reused output holder for the per-key total.
		private IntWritable result = new IntWritable();

		public void reduce(Text key, Iterable<IntWritable> values,
				Context context) throws IOException, InterruptedException {
			int sum = 0;
			for (IntWritable val : values) {
				sum += val.get();
			}
			result.set(sum);
			context.write(key, result);
		}
	}

	/**
	 * Configures and submits the word-count job, then waits for it to finish.
	 *
	 * @param args unused
	 * @throws IOException if the classes directory is missing
	 * @throws IllegalStateException if the job completes unsuccessfully
	 * @throws Exception on any other job setup or submission error
	 */
	public static void main(String[] args) throws Exception {
		Configuration conf = new Configuration();
		conf.set("mapred.job.tracker", "linux:9001");

		Job job = new Job(conf);
		job.setJarByClass(WordCount.class);

		// Package the compiled classes and use the result as the job JAR.
		// createTempJar returns null when the directory does not exist, so fail
		// with a clear message instead of a NullPointerException.
		File jarFile = JarTool.createTempJar(CLASSES_DIR);
		if (jarFile == null) {
			throw new IOException("Compiled classes directory not found: "
					+ new File(CLASSES_DIR).getAbsolutePath());
		}
		((JobConf) job.getConfiguration()).setJar(jarFile.toString());

		job.setMapperClass(TokenizerMapper.class);
		job.setReducerClass(IntSumReducer.class);
		job.setOutputKeyClass(Text.class);
		job.setOutputValueClass(IntWritable.class);

		FileInputFormat.setInputPaths(job, new Path(INPUT_PATH));

		// Remove any previous output so the job can write to OUT_PATH again.
		FileSystem fileSystem = FileSystem.get(new URI(OUT_PATH), conf);
		fileSystem.delete(new Path(OUT_PATH), true);
		FileOutputFormat.setOutputPath(job, new Path(OUT_PATH));

		// Surface job failure instead of silently returning as if it succeeded.
		if (!job.waitForCompletion(true)) {
			throw new IllegalStateException("WordCount job failed");
		}
	}
}

apache-bbccb

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
0
评论
Eclipse 环境下，将 MapReduce 作业提交到集群运行

package com.zte.esb.utils;import java.io.File;import java.io.FileInputStream;import java.io.FileOutputStream;import java.io.IOException;import java.util.jar.JarEntry;import java.util.jar.JarOut
复制链接

扫一扫

专栏目录