hadoop IntermediateRecordFactory 源码

  • 2022-10-20
  • 浏览 (184)

hadoop IntermediateRecordFactory 代码

文件路径:/hadoop-tools/hadoop-gridmix/src/main/java/org/apache/hadoop/mapred/gridmix/IntermediateRecordFactory.java

/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.hadoop.mapred.gridmix;

import java.io.IOException;

import org.apache.hadoop.conf.Configuration;

/**
 * Record factory that delegates to another {@link RecordFactory} and hands
 * the reduce specification to the consumer as the final record it produces.
 */
class IntermediateRecordFactory extends RecordFactory {

  private final GridmixKey.Spec spec;
  private final RecordFactory factory;
  private final int partition;
  private final long targetRecords;
  private boolean done = false;
  private long accRecords = 0L;

  /**
   * Builds a factory backed by a new {@link AvgRecordFactory}.
   *
   * @param targetBytes Expected byte count.
   * @param targetRecords Expected record count; the spec record is emitted
   *                      once this many records have been produced.
   * @param partition Reduce to which records are emitted.
   * @param spec Specification to emit.
   * @param conf Forwarded to the {@link AvgRecordFactory} that is created;
   *             not otherwise used by this class.
   */
  public IntermediateRecordFactory(long targetBytes, long targetRecords,
      int partition, GridmixKey.Spec spec, Configuration conf) {
    this(new AvgRecordFactory(targetBytes, targetRecords, conf), partition,
        targetRecords, spec, conf);
  }

  /**
   * Builds a factory that decorates the records of an existing factory.
   *
   * @param factory Factory from which byte/record counts are obtained.
   * @param partition Reduce to which records are emitted.
   * @param targetRecords Expected record count; the spec record is emitted
   *                      once this many records have been produced.
   * @param spec Specification to emit.
   * @param conf Unused.
   */
  public IntermediateRecordFactory(RecordFactory factory, int partition,
      long targetRecords, GridmixKey.Spec spec, Configuration conf) {
    this.factory = factory;
    this.targetRecords = targetRecords;
    this.partition = partition;
    this.spec = spec;
  }

  /**
   * Fetches the next record from the wrapped factory and tags it as either
   * data or reduce spec.
   *
   * @param key Key to populate; must not be null.
   * @param val Value to populate.
   * @return true if a record was produced, including a synthesized spec
   *         record when the wrapped factory ran out before one was emitted.
   */
  @Override
  public boolean next(GridmixKey key, GridmixRecord val) throws IOException {
    assert key != null;
    final boolean produced = factory.next(key, val);
    // counted on every call, whether or not the delegate produced a record
    accRecords++;

    if (!produced) {
      if (done) {
        key.setPartition(partition);
        return false;
      }
      // delegate is exhausted but no spec went out yet; ensure spec emitted
      emitEmptySpec(key, val);
      return true;
    }

    if (accRecords >= targetRecords) {
      convertToSpec(key, val);
    } else {
      key.setType(GridmixKey.DATA);
    }
    key.setPartition(partition);
    return true;
  }

  /**
   * Turns the record just produced by the wrapped factory into the reduce
   * spec record and resets the running counters.
   */
  private void convertToSpec(GridmixKey key, GridmixRecord val) {
    // key size must be sampled before the type/spec change below
    final int sizeBefore = key.getSize();
    key.setType(GridmixKey.REDUCE_SPEC);
    spec.rec_in = accRecords;
    key.setSpec(spec);
    // shrink the value by however much the key size changed
    // (presumably to keep the overall record size stable - confirm)
    final int keyDelta = key.getSize() - sizeBefore;
    val.setSize(val.getSize() - keyDelta);
    // reset counters
    accRecords = 0L;
    spec.bytes_out = 0L;
    spec.rec_out = 0L;
    done = true;
  }

  /**
   * Populates a zero-sized spec record for the case where the wrapped
   * factory finished before the record target was reached.
   */
  private void emitEmptySpec(GridmixKey key, GridmixRecord val) {
    key.setType(GridmixKey.REDUCE_SPEC);
    key.setPartition(partition);
    key.setSize(0);
    val.setSize(0);
    spec.rec_in = 0L;
    key.setSpec(spec);
    done = true;
  }

  /** Reports the progress of the wrapped factory. */
  @Override
  public float getProgress() throws IOException {
    return factory.getProgress();
  }

  /** Closes the wrapped factory. */
  @Override
  public void close() throws IOException {
    factory.close();
  }
}

相关信息

hadoop 源码目录

相关文章

hadoop AvgRecordFactory 源码

hadoop ClusterSummarizer 源码

hadoop CompressionEmulationUtil 源码

hadoop DistributedCacheEmulator 源码

hadoop EchoUserResolver 源码

hadoop ExecutionSummarizer 源码

hadoop FilePool 源码

hadoop FileQueue 源码

hadoop GenerateData 源码

hadoop GenerateDistCacheData 源码

0  赞