hadoop2.2的mapreduce问题

public class WordCountTx {
public static class MapClass extends MapReduceBase
implements Mapper<LongWritable, Text, Text, IntWritable> {

private final static IntWritable one = new IntWritable(1);
private Text word = new Text();

   @Override
   public void map(LongWritable key, Text value,
                  OutputCollector<Text, IntWritable> output,
         Reporter reporter) throws IOException {
            String line = value.toString();
            StringTokenizer itr = new StringTokenizer(line);
            while (itr.hasMoreTokens()) {
                  word.set(itr.nextToken());
                  output.collect(word, one);
            }
  }
  }

  public static class Reduce extends MapReduceBase
implements Reducer<Text, IntWritable, Text, IntWritable> {

   @Override
public void reduce(Text key, Iterator<IntWritable> values,
                     OutputCollector<Text, IntWritable> output,
                     Reporter reporter) throws IOException {
   int sum = 0;
   while (values.hasNext()) {
      sum += values.next().get();
   }
   output.collect(key, new IntWritable(sum));
}
  }

  public static void main(String[] args) throws Exception {

      JobConf conf = new JobConf(WordCountTx.class);
      // hdfs地址
      conf.set("fs.default.name", "hdfs://192.168.1.238:9000");
      conf.set("mapred.job.tracker","hdfs://192.168.1.238:9009");
      // 设置jar
      File jarFile = EightSpaceJob.createTempJar("bin");

      EightSpaceJob.addClasspath("/usr/hadoop/etc/hadoop");

      ClassLoader classLoader = EightSpaceJob.getClassLoader();

      Thread.currentThread().setContextClassLoader(classLoader);

      conf.setJar(jarFile.toString());

      conf.setJobName("wordcounttxt");

      conf.setOutputKeyClass(Text.class);
      conf.setOutputValueClass(IntWritable.class);

      conf.setMapperClass(MapClass.class);
      conf.setReducerClass(Reduce.class);

      FileInputFormat.setInputPaths(conf, new Path("/inpath/txttest"));
      FileOutputFormat.setOutputPath(conf, new Path("/logAalyse"));

      JobClient.runJob(conf);
  }
}
上边的代码是我写的，大家看看有什么问题，然后运行的时候报错如下
log4j:WARN No appenders could be found for logger (org.apache.hadoop.conf.Configuration.deprecation).
log4j:WARN Please initialize the log4j system properly.
log4j:WARN See http://logging.apache.org/log4j/1.2/faq.html#noconfig for more info.
Exception in thread "main" java.io.IOException: Cannot initialize Cluster. Please check your configuration for mapreduce.framework.name and the correspond server addresses.
at org.apache.hadoop.mapreduce.Cluster.initialize(Cluster.java:120)
at org.apache.hadoop.mapreduce.Cluster.<init>(Cluster.java:82)
at org.apache.hadoop.mapreduce.Cluster.<init>(Cluster.java:75)
at org.apache.hadoop.mapred.JobClient.init(JobClient.java:470)
at org.apache.hadoop.mapred.JobClient.<init>(JobClient.java:449)
at org.apache.hadoop.mapred.JobClient.runJob(JobClient.java:832)
at com.eightsapce.mapreducetxt.WordCountTx.main(WordCountTx.java:96)

有妳很满促 · 发表于 2013-12-16 12:50:08

public class WordCountTx {
public static class MapClass extends MapReduceBase
implements Mapper<LongWritable, Text, Text, IntWritable> {

private final static IntWritable one = new IntWritable(1);
private Text word = new Text();

   @Override
   public void map(LongWritable key, Text value,
                  OutputCollector<Text, IntWritable> output,
         Reporter reporter) throws IOException {
            String line = value.toString();
            StringTokenizer itr = new StringTokenizer(line);
            while (itr.hasMoreTokens()) {
                  word.set(itr.nextToken());
                  output.collect(word, one);
            }
  }
  }

  public static class Reduce extends MapReduceBase
implements Reducer<Text, IntWritable, Text, IntWritable> {

   @Override
public void reduce(Text key, Iterator<IntWritable> values,
                     OutputCollector<Text, IntWritable> output,
                     Reporter reporter) throws IOException {
   int sum = 0;
   while (values.hasNext()) {
      sum += values.next().get();
   }
   output.collect(key, new IntWritable(sum));
}
  }

  public static void main(String[] args) throws Exception {

      JobConf conf = new JobConf(WordCountTx.class);
      // hdfs地址
      conf.set("fs.default.name", "hdfs://192.168.1.238:9000");
      conf.set("mapred.job.tracker","hdfs://192.168.1.238:9009");
      // 设置jar
      File jarFile = EightSpaceJob.createTempJar("bin");

      EightSpaceJob.addClasspath("/usr/hadoop/etc/hadoop");

      ClassLoader classLoader = EightSpaceJob.getClassLoader();

      Thread.currentThread().setContextClassLoader(classLoader);

      conf.setJar(jarFile.toString());

      conf.setJobName("wordcounttxt");

      conf.setOutputKeyClass(Text.class);
      conf.setOutputValueClass(IntWritable.class);

      conf.setMapperClass(MapClass.class);
      conf.setReducerClass(Reduce.class);

      FileInputFormat.setInputPaths(conf, new Path("/inpath/txttest"));
      FileOutputFormat.setOutputPath(conf, new Path("/logAalyse"));

      JobClient.runJob(conf);
  }
}
上边的代码是我写的，大家看看有什么问题，然后运行的时候报错如下
log4j:WARN No appenders could be found for logger (org.apache.hadoop.conf.Configuration.deprecation).
log4j:WARN Please initialize the log4j system properly.
log4j:WARN See http://logging.apache.org/log4j/1.2/faq.html#noconfig for more info.
Exception in thread "main" java.io.IOException: Cannot initialize Cluster. Please check your configuration for mapreduce.framework.name and the correspond server addresses.
      at org.apache.hadoop.mapreduce.Cluster.initialize(Cluster.java:120)
      at org.apache.hadoop.mapreduce.Cluster.<init>(Cluster.java:82)
      at org.apache.hadoop.mapreduce.Cluster.<init>(Cluster.java:75)
      at org.apache.hadoop.mapred.JobClient.init(JobClient.java:470)
      at org.apache.hadoop.mapred.JobClient.<init>(JobClient.java:449)
      at org.apache.hadoop.mapred.JobClient.runJob(JobClient.java:832)
      at com.eightsapce.mapreducetxt.WordCountTx.main(WordCountTx.java:96)

lzw · 发表于 2013-12-16 14:07:38

有妳很满促发表于 2013-12-16 12:50

你是在eclipse中运行的还是用hadoop jar命令执行的。

lzw · 发表于 2013-12-16 14:19:24

我发现这个代码也不是haoop2.2.0的吧，应该是1.0之前的版本。

有妳很满促 · 发表于 2013-12-17 12:05:50

lzw 发表于 2013-12-16 14:07
你是在eclipse中运行的还是用hadoop jar命令执行的。

在eclipse中运行

有妳很满促 · 发表于 2013-12-17 12:06:38

lzw 发表于 2013-12-16 14:19
我发现这个代码也不是haoop2.2.0的吧，应该是1.0之前的版本。

我看网上说2.x和1.x代码一样啊

lzw · 发表于 2013-12-17 12:44:17

有妳很满促发表于 2013-12-17 12:06
我看网上说2.x和1.x代码一样啊

上面举的例子既不是1.0.x，也不是2.0.x版本的。

有妳很满促 · 发表于 2013-12-18 12:05:09

lzw 发表于 2013-12-17 12:44
上面举的例子既不是1.0.x，也不是2.0.x版本的。

那你有那个2.x的例子不

lzw · 发表于 2013-12-18 21:15:16

有妳很满促发表于 2013-12-18 12:05
那你有那个2.x的例子不

新建3个类文件，代码依次如下：Mapper 类：MaxTemperatureMapper.java

importjava.io.IOException; 

importorg.apache.hadoop.io.IntWritable;

importorg.apache.hadoop.io.LongWritable;

importorg.apache.hadoop.io.Text;

importorg.apache.hadoop.mapreduce.Mapper;

 

public class MaxTemperatureMapper extends Mapper<LongWritable, Text,Text, IntWritable> { 

         @Override

         public void map(LongWritable key, Text value, Context context) throws IOException, InterruptedException{                                    

                   String line =value.toString();                               

                   try {

                            String year =line.substring(0,4);

                            int airTemperature = Integer.parseInt(line.substring(5));            

                            context.write(new Text(year),new IntWritable(airTemperature));                           

                   } catch (Exception e) {

                            System.out.print("Error in line:" + line);

                   }                                  

         }        

}
复制代码

Reducer类：MaxTemperatureReducer.java
importjava.io.IOException; importorg.apache.hadoop.io.IntWritable; importorg.apache.hadoop.io.Text; importorg.apache.hadoop.mapreduce.Reducer; public class MaxTemperatureReducer extendsReducer<Text,IntWritable,Text,IntWritable> { @Override public void reduce(Text key, Iterable<IntWritable> values, Context context)throws IOException, InterruptedException { int maxValue = Integer.MIN_VALUE; for(IntWritable value: values){ maxValue = Math.max(maxValue,value.get()); } context.write(key, new IntWritable(maxValue)); } } 复制代码

主类：MaxTemperatureDriver.java

importorg.apache.hadoop.conf.Configuration; importorg.apache.hadoop.conf.Configured; importorg.apache.hadoop.fs.Path; importorg.apache.hadoop.io.IntWritable; importorg.apache.hadoop.io.Text; importorg.apache.hadoop.mapreduce.lib.input.FileInputFormat; importorg.apache.hadoop.mapreduce.lib.output.FileOutputFormat; importorg.apache.hadoop.mapreduce.Job; importorg.apache.hadoop.util.Tool; importorg.apache.hadoop.util.ToolRunner; public class MaxTemperatureDriver extends Configuredimplements Tool { @SuppressWarnings("deprecation") @Override public int run(String[] args) throwsException { if (args.length != 2){ System.err.printf("Usage: %s <input><output>",getClass().getSimpleName()); ToolRunner.printGenericCommandUsage(System.err); return -1; } Configuration conf =getConf(); Job job = newJob(getConf()); job.setJobName("Max Temperature"); job.setJarByClass(getClass()); FileInputFormat.addInputPath(job,new Path(args[0])); FileOutputFormat.setOutputPath(job,new Path(args[1])); job.setMapperClass(MaxTemperatureMapper.class); job.setReducerClass(MaxTemperatureReducer.class); job.setOutputKeyClass(Text.class); job.setOutputValueClass(IntWritable.class); return job.waitForCompletion(true)?0:1; } public static void main(String[] args)throws Exception{ int exitcode = ToolRunner.run(new MaxTemperatureDriver(), args); System.exit(exitcode); } } 复制代码