/examples/treasury_yield/src/main/java/com/mongodb/hadoop/examples/treasury/TreasuryYieldXMLConfigV2.java

https://gitlab.com/mkgobaco/mongo-hadoop · Java · 107 lines · 75 code · 14 blank · 18 comment · 1 complexity · 1960ae7018257a3ce5f2df177e9ef1bd MD5 · raw file

  1. /*
  2. * Copyright 2011 10gen Inc.
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. package com.mongodb.hadoop.examples.treasury;
  17. import com.mongodb.hadoop.io.BSONWritable;
  18. import com.mongodb.hadoop.mapred.MongoInputFormat;
  19. import com.mongodb.hadoop.mapred.MongoOutputFormat;
  20. import com.mongodb.hadoop.util.MongoConfigUtil;
  21. import org.apache.commons.logging.Log;
  22. import org.apache.commons.logging.LogFactory;
  23. import org.apache.hadoop.conf.Configuration;
  24. import org.apache.hadoop.conf.Configured;
  25. import org.apache.hadoop.io.DoubleWritable;
  26. import org.apache.hadoop.io.IntWritable;
  27. import org.apache.hadoop.mapred.JobClient;
  28. import org.apache.hadoop.mapred.JobConf;
  29. import org.apache.hadoop.mapred.MapReduceBase;
  30. import org.apache.hadoop.mapred.Mapper;
  31. import org.apache.hadoop.mapred.OutputCollector;
  32. import org.apache.hadoop.mapred.Reducer;
  33. import org.apache.hadoop.mapred.Reporter;
  34. import org.apache.hadoop.util.Tool;
  35. import org.apache.hadoop.util.ToolRunner;
  36. import org.bson.BasicBSONObject;
  37. import java.io.IOException;
  38. import java.util.Date;
  39. import java.util.Iterator;
  40. /**
  41. * The treasury yield xml config object.
  42. */
  43. public class TreasuryYieldXMLConfigV2 extends Configured implements Tool {
  44. private static final Log LOG = LogFactory.getLog(TreasuryYieldXMLConfigV2.class);
  45. static class TreasuryYieldMapperV2 extends MapReduceBase implements Mapper<BSONWritable, BSONWritable, IntWritable, DoubleWritable> {
  46. @Override
  47. @SuppressWarnings("deprecation")
  48. public void map(final BSONWritable key, final BSONWritable value, final OutputCollector<IntWritable, DoubleWritable> output,
  49. final Reporter reporter)
  50. throws IOException {
  51. final int year = ((Date) value.getDoc().get("_id")).getYear() + 1900;
  52. double bid10Year = ((Number) value.getDoc().get("bc10Year")).doubleValue();
  53. output.collect(new IntWritable(year), new DoubleWritable(bid10Year));
  54. }
  55. }
  56. static class TreasuryYieldReducerV2 extends MapReduceBase implements Reducer<IntWritable, DoubleWritable, IntWritable, BSONWritable> {
  57. @Override
  58. public void reduce(final IntWritable key, final Iterator<DoubleWritable> values,
  59. final OutputCollector<IntWritable, BSONWritable> output, final Reporter reporter) throws IOException {
  60. int count = 0;
  61. double sum = 0;
  62. while (values.hasNext()) {
  63. DoubleWritable value = values.next();
  64. sum += value.get();
  65. count++;
  66. }
  67. final double avg = sum / count;
  68. LOG.info("V2: Average 10 Year Treasury for " + key.get() + " was " + avg);
  69. BasicBSONObject outputObj = new BasicBSONObject();
  70. outputObj.put("count", count);
  71. outputObj.put("avg", avg);
  72. outputObj.put("sum", sum);
  73. output.collect(key, new BSONWritable(outputObj));
  74. }
  75. }
  76. public int run(final String[] args) throws Exception {
  77. final Configuration conf = getConf();
  78. final JobConf job = new JobConf(conf);
  79. job.setReducerClass(TreasuryYieldReducerV2.class);
  80. job.setMapperClass(TreasuryYieldMapperV2.class);
  81. job.setOutputFormat(MongoOutputFormat.class);
  82. job.setOutputKeyClass(MongoConfigUtil.getOutputKey(conf));
  83. job.setOutputValueClass(MongoConfigUtil.getOutputValue(conf));
  84. job.setMapOutputKeyClass(MongoConfigUtil.getMapperOutputKey(conf));
  85. job.setMapOutputValueClass(MongoConfigUtil.getMapperOutputValue(conf));
  86. job.setInputFormat(MongoInputFormat.class);
  87. JobClient.runJob(job);
  88. return 0;
  89. }
  90. public static void main(final String[] args) throws Exception {
  91. ToolRunner.run(new TreasuryYieldXMLConfigV2(), args);
  92. }
  93. }