MapReduce 分布式缓存

时间:2014-06-15 12:14:11

标签: eclipse hadoop mapreduce distributed-caching distributed-cache

我的 DriverClass 在 job.waitForCompletion(boolean) 这一行无法通过编译,编译器提示存在未处理的 ClassNotFoundException。如果我用 try/catch 捕获该异常,run 方法又会报错,提示它需要返回一个 int 值。我使用的是 MapReduce 的新 API。有人能指出问题所在吗:

import java.io.File;
import java.io.IOException;
import java.net.URI;
import java.net.URISyntaxException;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.conf.Configured;
import org.apache.hadoop.filecache.DistributedCache;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.util.GenericOptionsParser;
import org.apache.hadoop.util.Tool;
import org.apache.hadoop.util.ToolRunner;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.input.KeyValueTextInputFormat;
import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
import org.apache.hadoop.mapreduce.lib.output.TextOutputFormat;


public class Dist_Driver extends Configured implements Tool {

    public int run(String args[]) throws IOException, InterruptedException {

        // Configuration phase
        // Configuration conf=new Configuration();
        Job job = new Job(new Configuration());
        job.setJarByClass(Dist_Driver.class);

        // Mapper Reducer InputFormat
        job.setInputFormatClass(FileInputFormat.class);
        // Mapper and Reducer Class
        job.setMapperClass(Dist_Mapper.class);
        job.setReducerClass(DistCache_Reducer.class);

        job.setOutputFormatClass(TextOutputFormat.class);
        job.setInputFormatClass(KeyValueTextInputFormat.class);
        // set FileInputOutput
        FileInputFormat.addInputPath(job, new Path(args[0]));
        FileOutputFormat.setOutputPath(job, new Path(args[1]));
        // setting number of reduce tasks and submit it
        job.setNumReduceTasks(2);

        // Lets check if the file exist
        File f1 = new File("/home/hdfs/trials_mapreduce_progams/emp_id");
        if (f1.exists())
            System.out.println("The Files Exists");
        else
            System.out.println("The File doesnot exist");
        URI path1;
        try {
            path1 = new URI(
                    "/home/hdfs/trials_mapreduce_progams/emp_lookup.txt");
            DistributedCache.addCacheFile(path1, job.getConfiguration());
        } catch (URISyntaxException e) {
            // TODO Auto-generated catch block
            e.printStackTrace();
        }

        if (job.waitForCompletion(true))
            return 0;
        else
            return 1;

    }

    public static void main(String[] args) throws Exception {

        int exitcode = ToolRunner.run(new Dist_Driver(), args);
        System.exit(exitcode);

    }

}

1 个答案:

答案 0 :(得分:0)

只需将 ClassNotFoundException 添加到 run 方法签名的 throws 子句中即可:
public int run(String args[]) throws IOException, 
                                     InterruptedException, 
                                     ClassNotFoundException {

您使用 try/catch 时出错的原因是:如果执行期间抛出了 ClassNotFoundException,catch 分支中没有返回值,而该方法必须返回一个 int 值。

如果您确实想捕获该异常,只需在 catch 子句中加上 return 1 即可,1 是表示出错的退出码。