Java RCFileOutputFormat Examples

Programming Language: Java

Namespace/Package Name: org.apache.hadoop.hive.ql.io

Examples at hotexamples.com: 1

Java RCFileOutputFormat - 1 example found. This is the top-rated real-world Java example of org.apache.hadoop.hive.ql.io.RCFileOutputFormat extracted from open source projects. You can rate examples to help us improve their quality.

Frequently Used Methods

Show Hide

setOutputPath(1)

Frequently Used Methods

setOutputPath (1)

Example #1

Show file

File: PartitionCompactor.java Project: Volney/Hive.Generate.DDL

  /**
   * Configures and runs the "PartitionCompactor" job for one partition.
   *
   * <p>Both input paths are registered with {@code RCFileInputFormat}; the job's output format
   * is {@code RCFileOutputFormat}, pointed at {@code outputPath}. The two input paths and the
   * primary-key list are also stored in the job configuration under
   * {@code EXISTING_FILE_PATH_CONF}, {@code DELTA_FILE_PATH_CONF} and {@code PRIMARY_KEYS_CONF}
   * (presumably so the mapper/reducer can read them back; confirm against those classes).
   *
   * @param existingInputPath path added as the first job input
   * @param deltaInputPath path added as the second job input
   * @param primaryKeyList value stored under {@code PRIMARY_KEYS_CONF}
   * @param maxColumns value stored under {@code RCFile.COLUMN_NUMBER_CONF_STR}
   * @param outputPath path handed to {@code RCFileOutputFormat.setOutputPath}
   * @param numberOfReducers number of reduce tasks, as a decimal integer string
   * @throws IOException propagated from submitting or waiting on the job
   * @throws NumberFormatException if {@code numberOfReducers} is not a parsable integer
   */
  private static void compactASinglePartition(
      String existingInputPath,
      String deltaInputPath,
      String primaryKeyList,
      String maxColumns,
      String outputPath,
      String numberOfReducers)
      throws IOException {
    JobConf jobConf = new JobConf(new Configuration(), PartitionCompactor.class);
    jobConf.setJobName("PartitionCompactor");

    // Processing stages and the format used to read the inputs.
    jobConf.setInputFormat(RCFileInputFormat.class);
    jobConf.setMapperClass(CustomMapper.class);
    jobConf.setPartitionerClass(CustomPartitioner.class);
    jobConf.setReducerClass(CustomReducer.class);

    // Key/value types: intermediate (map output) first, then final job output.
    jobConf.setMapOutputKeyClass(Text.class);
    jobConf.setMapOutputValueClass(BytesRefArrayWritable.class);
    jobConf.setOutputKeyClass(LongWritable.class);
    jobConf.setOutputValueClass(BytesRefArrayWritable.class);

    int reducerCount = Integer.parseInt(numberOfReducers);
    jobConf.setNumReduceTasks(reducerCount);

    // Job-specific settings carried in the configuration.
    jobConf.set(EXISTING_FILE_PATH_CONF, existingInputPath);
    jobConf.set(DELTA_FILE_PATH_CONF, deltaInputPath);
    jobConf.set(PRIMARY_KEYS_CONF, primaryKeyList);
    jobConf.set(RCFile.COLUMN_NUMBER_CONF_STR, maxColumns);

    // Inputs: the existing data first, then the delta.
    Path existingInput = new Path(existingInputPath);
    RCFileInputFormat.addInputPath(jobConf, existingInput);
    Path deltaInput = new Path(deltaInputPath);
    RCFileInputFormat.addInputPath(jobConf, deltaInput);

    // Output.
    jobConf.setOutputFormat(RCFileOutputFormat.class);
    RCFileOutputFormat.setOutputPath(jobConf, new Path(outputPath));

    // Submit the job, then wait on the returned handle as well.
    JobClient.runJob(jobConf).waitForCompletion();
  }