| /** |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package org.apache.hadoop.mapred.gridmix; |
| |
| import java.io.IOException; |
| |
| import org.apache.hadoop.conf.Configuration; |
| |
| /** |
| * Factory passing reduce specification as its last record. |
| */ |
| class IntermediateRecordFactory extends RecordFactory { |
| |
| private final GridmixKey.Spec spec; |
| private final RecordFactory factory; |
| private final int partition; |
| private final long targetRecords; |
| private boolean done = false; |
| private long accRecords = 0L; |
| |
| /** |
| * @param targetBytes Expected byte count. |
| * @param targetRecords Expected record count; will emit spec records after |
| * this boundary is passed. |
| * @param partition Reduce to which records are emitted. |
| * @param spec Specification to emit. |
| * @param conf Unused. |
| */ |
| public IntermediateRecordFactory(long targetBytes, long targetRecords, |
| int partition, GridmixKey.Spec spec, Configuration conf) { |
| this(new AvgRecordFactory(targetBytes, targetRecords, conf), partition, |
| targetRecords, spec, conf); |
| } |
| |
| /** |
| * @param factory Factory from which byte/record counts are obtained. |
| * @param partition Reduce to which records are emitted. |
| * @param targetRecords Expected record count; will emit spec records after |
| * this boundary is passed. |
| * @param spec Specification to emit. |
| * @param conf Unused. |
| */ |
| public IntermediateRecordFactory(RecordFactory factory, int partition, |
| long targetRecords, GridmixKey.Spec spec, Configuration conf) { |
| this.spec = spec; |
| this.factory = factory; |
| this.partition = partition; |
| this.targetRecords = targetRecords; |
| } |
| |
| @Override |
| public boolean next(GridmixKey key, GridmixRecord val) throws IOException { |
| assert key != null; |
| final boolean rslt = factory.next(key, val); |
| ++accRecords; |
| if (rslt) { |
| if (accRecords < targetRecords) { |
| key.setType(GridmixKey.DATA); |
| } else { |
| final int orig = key.getSize(); |
| key.setType(GridmixKey.REDUCE_SPEC); |
| spec.rec_in = accRecords; |
| key.setSpec(spec); |
| val.setSize(val.getSize() - (key.getSize() - orig)); |
| // reset counters |
| accRecords = 0L; |
| spec.bytes_out = 0L; |
| spec.rec_out = 0L; |
| done = true; |
| } |
| } else if (!done) { |
| // ensure spec emitted |
| key.setType(GridmixKey.REDUCE_SPEC); |
| key.setPartition(partition); |
| key.setSize(0); |
| val.setSize(0); |
| spec.rec_in = 0L; |
| key.setSpec(spec); |
| done = true; |
| return true; |
| } |
| key.setPartition(partition); |
| return rslt; |
| } |
| |
| @Override |
| public float getProgress() throws IOException { |
| return factory.getProgress(); |
| } |
| |
| @Override |
| public void close() throws IOException { |
| factory.close(); |
| } |
| } |