eclipse设置运行在yarn上后失败，不设置就可以运行

跟帖没人回答，只好发帖求助。在hadoop2.4.1伪分布环境中，用MyEclipse10和相应的插件，运行hadoop自带的WordCount程序，先前出现“/bin/bash: line 0: fg: no job control”，按照论坛里的方法重新编译了YARNRunner类，然后就总是出现以下错误：

用了各种方法，比如在mapred-site.xml和yarn-site.xml中设置“mapreduce.application.classpath”属性，但都没有解决上述问题，请问哪位可以帮忙解决一下？WordCount程序中的main方法如下：
/**
 * Configures the WordCount job for submission to YARN, runs it, and exits the JVM
 * with status 0 when the job succeeds or 1 when it fails.
 *
 * <p>Usage: {@code wordcount <in> <out>}. Generic Hadoop options are consumed by
 * {@link GenericOptionsParser} first. When no paths remain on the command line
 * (for example when launched from the IDE without program arguments), the
 * hard-coded HDFS test paths below are used, so a no-argument launch keeps the
 * previous behaviour.
 *
 * @param args generic Hadoop options, optionally followed by the input and output paths
 * @throws Exception if job setup or execution fails
 */
public static void main(String[] args) throws Exception {
    Configuration conf = new Configuration();
    conf.set("mapreduce.framework.name", "yarn");
    conf.set("yarn.resourcemanager.address", "10.35.1.177:8032");

    // Parse the real command line instead of discarding it; the previous code
    // replaced args with the hard-coded paths before parsing.
    String[] otherArgs = new GenericOptionsParser(conf, args).getRemainingArgs();
    if (otherArgs.length == 0) {
        otherArgs = new String[] {
            "hdfs://10.35.1.177:9000/test/aa",
            "hdfs://10.35.1.177:9000/test/output"
        };
    }
    if (otherArgs.length != 2) {
        System.err.println("Usage: wordcount <in> <out>");
        System.exit(2);
    }

    // Job.getInstance replaces the deprecated Job(Configuration, String) constructor.
    Job job = Job.getInstance(conf, "word count");
    job.setJarByClass(WordCount.class);
    job.setMapperClass(TokenizerMapper.class);
    job.setCombinerClass(IntSumReducer.class);
    job.setReducerClass(IntSumReducer.class);
    job.setOutputKeyClass(Text.class);
    job.setOutputValueClass(IntWritable.class);
    FileInputFormat.addInputPath(job, new Path(otherArgs[0]));
    FileOutputFormat.setOutputPath(job, new Path(otherArgs[1]));

    System.exit(job.waitForCompletion(true) ? 0 : 1);
}

sstutu · 发表于 2014-8-7 09:22:45

看看自己哪里需要改进，只能帮你再次确认一下：

具体步骤，改写YARNRunner源码中的一些方法（YARNRunner.java源码类在hadoop-mapreduce-client-jobclient的maven项目中的org.apache.hadoop.mapred包下）需要在src下建同样的包名，类名，覆盖原来jar包里面自带的类。

YARNRunner.java的390行（Apache Hadoop2.2的源码）

// Set up the command line used to run the AM (excerpt quoted from YARNRunner).
// The first argument is the java executable under the JAVA_HOME environment reference.
    List<String> vargs = new ArrayList<String>(8);  
    vargs.add(Environment.JAVA_HOME.$() + "/bin/java");  
复制代码

改为

vargs.add("$JAVA_HOME/bin/java");  
复制代码

在YARNRunner.java类中，新增一个路径转换的方法

private void replaceEnvironment(Map<String, String> environment) {  
      String tmpClassPath = environment.get("CLASSPATH");  
      tmpClassPath=tmpClassPath.replaceAll(";", ":");  
      tmpClassPath=tmpClassPath.replaceAll("%PWD%", "\\$PWD");  
      tmpClassPath=tmpClassPath.replaceAll("%HADOOP_MAPRED_HOME%", "\\$HADOOP_MAPRED_HOME");  
      tmpClassPath= tmpClassPath.replaceAll("\\\", "/" );  
      environment.put("CLASSPATH",tmpClassPath);  
}  
复制代码

在YARNRunner.java的466行添加：

replaceEnvironment(environment);  
复制代码

通过这样设置后，原来的异常就得到解决了。这里分布式测试的例子依旧是hello world，源码如下：

package com.qin.wordcount;

import java.io.IOException;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapred.JobConf;
import org.apache.hadoop.mapred.YARNRunner;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
import org.apache.hadoop.mapreduce.lib.output.TextOutputFormat;

/***
 * 
 * Hadoop2.2.0完全分布式测试
 * 放WordCount的例子
 * 
 * @author qindongliang
 * 
 * hadoop技术交流群：  376932160
 * 
 * 
 * */
public class MyWordCount {
        
        
        /**
         * Mapper
         * 
         * **/
        private static class WMapper extends Mapper<LongWritable, Text, Text, IntWritable>{
                
                
                private IntWritable count=new IntWritable(1);
                private Text text=new Text();
                @Override
                protected void map(LongWritable key, Text value,Context context)
                                throws IOException, InterruptedException {
                        String values[]=value.toString().split("#");
                        //System.out.println(values[0]+"========"+values[1]);
                        count.set(Integer.parseInt(values[1]));
                        text.set(values[0]);
                        context.write(text,count);
                        
                }
                
        }
        
        /**
         * Reducer
         * 
         * **/
        private static class WReducer extends Reducer<Text, IntWritable, Text, Text>{
                
                private Text t=new Text();
                @Override
                protected void reduce(Text key, Iterable<IntWritable> value,Context context)
                                throws IOException, InterruptedException {
                        int count=0;
                        for(IntWritable i:value){
                                count+=i.get();
                        }
                        t.set(count+"");
                        context.write(key,t);
                        
                }
                
        }
        
        
        /**
         * 改动一
         * (1)shell源码里添加checkHadoopHome的路径
         * (2)974行，FileUtils里面
         * **/
        
        public static void main(String[] args) throws Exception{
                
                
                Configuration conf=new Configuration();
                
            conf.set("mapreduce.job.jar", "myjob.jar");
                conf.set("fs.defaultFS","hdfs://192.168.46.28:9000");
                conf.set("mapreduce.framework.name", "yarn");  
                conf.set("yarn.resourcemanager.address", "192.168.46.28:8032"); 
                /**Job任务**/
           //Job job=new Job(conf, "testwordcount");//废弃此API
           Job job=Job.getInstance(conf, "new api");
                job.setJarByClass(MyWordCount.class);
                System.out.println("模式：  "+conf.get("mapreduce.jobtracker.address"));;
                // job.setCombinerClass(PCombine.class);
        
                 
                 
                // job.setNumReduceTasks(3);//设置为3
                 job.setMapperClass(WMapper.class);
                 job.setReducerClass(WReducer.class);
                 job.setInputFormatClass(TextInputFormat.class);
                 job.setOutputFormatClass(TextOutputFormat.class);
 
         
                
                 job.setMapOutputKeyClass(Text.class);
                 job.setMapOutputValueClass(IntWritable.class);
                 job.setOutputKeyClass(Text.class);
                 job.setOutputValueClass(Text.class);
        
                        String path="hdfs://192.168.46.28:9000/qin/output";
                        FileSystem fs=FileSystem.get(conf);
                        Path p=new Path(path);
                        if(fs.exists(p)){
                                fs.delete(p, true);
                                System.out.println("输出路径存在，已删除！");
                        }
                FileInputFormat.setInputPaths(job, "hdfs://192.168.46.28:9000/qin/input");
                FileOutputFormat.setOutputPath(job,p );
                System.exit(job.waitForCompletion(true) ? 0 : 1);  
                
                
                
                
        }
        

}
复制代码

在运行的时候，需要注意把hadoop集群上的配置文件core-site.xml、hdfs-site.xml、mapred-site.xml、yarn-site.xml拷贝到src的根目录下，最好也放一个log4j.xml方便查看日志。并在mapred-site.xml里面添加如下属性：

<property>
 <name>mapred.remote.os</name>
 <value>Linux</value>
 <description>Remote MapReduce framework's OS, can be either Linux or Windows</description>
</property>
复制代码

然后，把项目打成jar包，运行提交作业，控制台打印内容如下：

模式：  hp1:8021
输出路径存在，已删除！
INFO - RMProxy.createRMProxy(56) | Connecting to ResourceManager at /192.168.46.28:8032
WARN - JobSubmitter.copyAndConfigureFiles(149) | Hadoop command-line option parsing not performed. Implement the Tool interface and execute your application with ToolRunner to remedy this.
INFO - FileInputFormat.listStatus(287) | Total input paths to process : 1
INFO - JobSubmitter.submitJobInternal(394) | number of splits:1
INFO - Configuration.warnOnceIfDeprecated(840) | user.name is deprecated. Instead, use mapreduce.job.user.name
INFO - Configuration.warnOnceIfDeprecated(840) | mapred.jar is deprecated. Instead, use mapreduce.job.jar
INFO - Configuration.warnOnceIfDeprecated(840) | fs.default.name is deprecated. Instead, use fs.defaultFS
INFO - Configuration.warnOnceIfDeprecated(840) | mapred.output.value.class is deprecated. Instead, use mapreduce.job.output.value.class
INFO - Configuration.warnOnceIfDeprecated(840) | mapred.mapoutput.value.class is deprecated. Instead, use mapreduce.map.output.value.class
INFO - Configuration.warnOnceIfDeprecated(840) | mapreduce.map.class is deprecated. Instead, use mapreduce.job.map.class
INFO - Configuration.warnOnceIfDeprecated(840) | mapred.job.name is deprecated. Instead, use mapreduce.job.name
INFO - Configuration.warnOnceIfDeprecated(840) | mapreduce.reduce.class is deprecated. Instead, use mapreduce.job.reduce.class
INFO - Configuration.warnOnceIfDeprecated(840) | mapreduce.inputformat.class is deprecated. Instead, use mapreduce.job.inputformat.class
INFO - Configuration.warnOnceIfDeprecated(840) | mapred.input.dir is deprecated. Instead, use mapreduce.input.fileinputformat.inputdir
INFO - Configuration.warnOnceIfDeprecated(840) | mapred.output.dir is deprecated. Instead, use mapreduce.output.fileoutputformat.outputdir
INFO - Configuration.warnOnceIfDeprecated(840) | mapreduce.outputformat.class is deprecated. Instead, use mapreduce.job.outputformat.class
INFO - Configuration.warnOnceIfDeprecated(840) | mapred.map.tasks is deprecated. Instead, use mapreduce.job.maps
INFO - Configuration.warnOnceIfDeprecated(840) | mapred.output.key.class is deprecated. Instead, use mapreduce.job.output.key.class
INFO - Configuration.warnOnceIfDeprecated(840) | mapred.mapoutput.key.class is deprecated. Instead, use mapreduce.map.output.key.class
INFO - Configuration.warnOnceIfDeprecated(840) | mapred.working.dir is deprecated. Instead, use mapreduce.job.working.dir
INFO - JobSubmitter.printTokens(477) | Submitting tokens for job: job_1402492118962_0004
INFO - YarnClientImpl.submitApplication(174) | Submitted application application_1402492118962_0004 to ResourceManager at /192.168.46.28:8032
INFO - Job.submit(1272) | The url to track the job: http://hp1:8088/proxy/application_1402492118962_0004/
INFO - Job.monitorAndPrintJob(1317) | Running job: job_1402492118962_0004
INFO - Job.monitorAndPrintJob(1338) | Job job_1402492118962_0004 running in uber mode : false
INFO - Job.monitorAndPrintJob(1345) |  map 0% reduce 0%
INFO - Job.monitorAndPrintJob(1345) |  map 100% reduce 0%
INFO - Job.monitorAndPrintJob(1345) |  map 100% reduce 100%
INFO - Job.monitorAndPrintJob(1356) | Job job_1402492118962_0004 completed successfully
INFO - Job.monitorAndPrintJob(1363) | Counters: 43
        File System Counters
                FILE: Number of bytes read=58
                FILE: Number of bytes written=159667
                FILE: Number of read operations=0
                FILE: Number of large read operations=0
                FILE: Number of write operations=0
                HDFS: Number of bytes read=147
                HDFS: Number of bytes written=27
                HDFS: Number of read operations=6
                HDFS: Number of large read operations=0
                HDFS: Number of write operations=2
        Job Counters 
                Launched map tasks=1
                Launched reduce tasks=1
                Data-local map tasks=1
                Total time spent by all maps in occupied slots (ms)=6155
                Total time spent by all reduces in occupied slots (ms)=4929
        Map-Reduce Framework
                Map input records=4
                Map output records=4
                Map output bytes=44
                Map output materialized bytes=58
                Input split bytes=109
                Combine input records=0
                Combine output records=0
                Reduce input groups=3
                Reduce shuffle bytes=58
                Reduce input records=4
                Reduce output records=3
                Spilled Records=8
                Shuffled Maps =1
                Failed Shuffles=0
                Merged Map outputs=1
                GC time elapsed (ms)=99
                CPU time spent (ms)=1060
                Physical memory (bytes) snapshot=309071872
                Virtual memory (bytes) snapshot=1680531456
                Total committed heap usage (bytes)=136450048
        Shuffle Errors
                BAD_ID=0
                CONNECTION=0
                IO_ERROR=0
                WRONG_LENGTH=0
                WRONG_MAP=0
                WRONG_REDUCE=0
        File Input Format Counters 
                Bytes Read=38
        File Output Format Counters 
                Bytes Written=27
复制代码

chenyang · 发表于 2014-8-7 09:43:35

sstutu 发表于 2014-8-7 09:22
看看自己哪里需要改进，只能帮你再次确认一下：

hadoop2.4.1的YARNRunner类和hadoop2.2不一样，这样修改是否有啥其他问题？另外，用该方法是针对修复“/bin/bash: line 0: fg: no job control”问题吧。

sstutu · 发表于 2014-8-7 09:59:00

chenyang 发表于 2014-8-7 09:43
hadoop2.4.1的YARNRunner类和hadoop2.2不一样，这样修改是否有啥其他问题？另外，用该方法是针对修复”/b ...

这个是尝试解决你的问题的，像下面这些，还有你的程序，最好也看看。跟别的地方哪里有所不同

// Client-side settings used when submitting the job to the remote cluster.
Configuration conf=new Configuration();
// Jar file that carries the job's classes.
conf.set("mapreduce.job.jar", "myjob.jar");
// Default file system: the cluster's HDFS.
conf.set("fs.defaultFS","hdfs://192.168.46.28:9000");
// Run the job on YARN.
conf.set("mapreduce.framework.name", "yarn");
// Address of the YARN ResourceManager that receives the submission.
conf.set("yarn.resourcemanager.address", "192.168.46.28:8032");

chenyang · 发表于 2014-8-7 10:14:37

sstutu 发表于 2014-8-7 09:59
这个是尝试解决你的问题的，像下面这些，还有你的程序，最好也看看。跟别的地方哪里有所不同

Configur ...

打成jar包后放到Linux上可以正常运行，但在MyEclipse环境下就不能运行，说明程序是没多大问题的，只是windows连接Linux的配置没设置好。

desehawk · 发表于 2014-8-7 11:06:33

本帖最后由 desehawk 于 2014-8-7 11:08 编辑

chenyang 发表于 2014-8-7 10:14
压缩jar后放在Linux后可以正常运行，但在Myclipse环境下就不能运行，说明程序是没多大问题的，只是window ...

为什么我就没有遇到你们的问题啊，是在什么环境下啊。
直接使用Eclipse插件链接不就行了吗？当然还需要

hadoop.dll
winutils.exe

chenyang · 发表于 2014-8-7 12:21:14

desehawk 发表于 2014-8-7 11:06
本帖最后由 desehawk 于 2014-8-7 11:08 编辑

为什么我就没有遇到你们的问题啊，是在什么环境下啊。

已经用了hadoop-common-2.2.0-bin.rar压缩包里的这两个文件（不用这两个文件会报错），但用了之后还是报错。
环境：
CentOS 6.4- 64位，Hadoop2.4.1伪分布，MyEclipse编程是在windows32位下，插件是根据hadoop2.4.1安装包生成的插件。

chenyang · 发表于 2014-8-7 12:41:07

desehawk 发表于 2014-8-7 11:06
本帖最后由 desehawk 于 2014-8-7 11:08 编辑

为什么我就没有遇到你们的问题啊，是在什么环境下啊。

你的是什么版本啊？

desehawk · 发表于 2014-8-7 14:11:00

chenyang 发表于 2014-8-7 12:41
你的是什么版本啊？

我的是hadoop2.2 Ubuntu
win7 64 Eclipse下面，但是我见到网上2.2也有类似的问题，但是我怎么没有遇到呢？

chenyang · 发表于 2014-8-7 14:52:56

本帖最后由 chenyang 于 2014-8-7 14:55 编辑

sstutu 发表于 2014-8-7 09:59
这个是尝试解决你的问题的，像下面这些，还有你的程序，最好也看看。跟别的地方哪里有所不同

Configur ...

错误日志如下，报出没找到相关的类，在配置yarn-site.xml中增加了"yarn.application.classpath"参数也不起作用啊。

Exception in thread "main" java.lang.NoClassDefFoundError: org/apache/hadoop/service/CompositeService
        at java.lang.ClassLoader.defineClass1(Native Method)
        at java.lang.ClassLoader.defineClass(ClassLoader.java:800)
        at java.security.SecureClassLoader.defineClass(SecureClassLoader.java:142)
        at java.net.URLClassLoader.defineClass(URLClassLoader.java:449)
        at java.net.URLClassLoader.access$100(URLClassLoader.java:71)
        at java.net.URLClassLoader$1.run(URLClassLoader.java:361)
        at java.net.URLClassLoader$1.run(URLClassLoader.java:355)
        at java.security.AccessController.doPrivileged(Native Method)
        at java.net.URLClassLoader.findClass(URLClassLoader.java:354)
        at java.lang.ClassLoader.loadClass(ClassLoader.java:425)
        at sun.misc.Launcher$AppClassLoader.loadClass(Launcher.java:308)
        at java.lang.ClassLoader.loadClass(ClassLoader.java:358)
        at sun.launcher.LauncherHelper.checkAndLoadMain(LauncherHelper.java:482)
Caused by: java.lang.ClassNotFoundException: org.apache.hadoop.service.CompositeService
        at java.net.URLClassLoader$1.run(URLClassLoader.java:366)
        at java.net.URLClassLoader$1.run(URLClassLoader.java:355)
        at java.security.AccessController.doPrivileged(Native Method)
        at java.net.URLClassLoader.findClass(URLClassLoader.java:354)
        at java.lang.ClassLoader.loadClass(ClassLoader.java:425)
        at sun.misc.Launcher$AppClassLoader.loadClass(Launcher.java:308)
        at java.lang.ClassLoader.loadClass(ClassLoader.java:358)
        ... 13 more
 
复制代码

图文精华

eclipse设置运行在yarn上后失败，不设置就可以运行

已有(11)人评论

活跃会员

热心会员

优秀版主

推荐 /2