/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hudi.table.action.commit;

import org.apache.hudi.client.WriteStatus;
import org.apache.hudi.client.utils.SparkMemoryUtils;
import org.apache.hudi.client.common.HoodieEngineContext;
import org.apache.hudi.common.model.HoodieBaseFile;
import org.apache.hudi.common.model.HoodieCommitMetadata;
import org.apache.hudi.common.model.HoodieKey;
import org.apache.hudi.common.model.HoodieRecord;
import org.apache.hudi.common.model.HoodieRecordLocation;
import org.apache.hudi.common.model.HoodieRecordPayload;
import org.apache.hudi.common.model.HoodieWriteStat;
import org.apache.hudi.common.model.WriteOperationType;
import org.apache.hudi.common.table.timeline.HoodieActiveTimeline;
import org.apache.hudi.common.table.timeline.HoodieInstant;
import org.apache.hudi.common.util.CommitUtils;
import org.apache.hudi.common.util.Option;
import org.apache.hudi.common.util.collection.Pair;
import org.apache.hudi.config.HoodieWriteConfig;
import org.apache.hudi.exception.HoodieCommitException;
import org.apache.hudi.exception.HoodieUpsertException;
import org.apache.hudi.execution.SparkLazyInsertIterable;
import org.apache.hudi.io.CreateHandleFactory;
import org.apache.hudi.io.HoodieMergeHandle;
import org.apache.hudi.io.HoodieSortedMergeHandle;
import org.apache.hudi.table.HoodieSparkTable;
import org.apache.hudi.table.HoodieTable;
import org.apache.hudi.table.WorkloadProfile;
import org.apache.hudi.table.WorkloadStat;
import org.apache.hudi.table.action.HoodieWriteMetadata;
import org.apache.log4j.LogManager;
import org.apache.log4j.Logger;
import org.apache.spark.Partitioner;
import org.apache.spark.api.java.JavaPairRDD;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.storage.StorageLevel;
import scala.Tuple2;
import java.io.IOException;
import java.io.Serializable;
import java.nio.charset.StandardCharsets;
import java.time.Duration;
import java.time.Instant;
import java.util.Collections;
import java.util.Comparator;
import java.util.HashMap;
import java.util.Iterator;
import java.util.List;
import java.util.Map;

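/**
 * Base Spark implementation of the commit action executor. It caches and (optionally) profiles the
 * incoming records, distributes them across file groups via an upsert/insert {@link Partitioner},
 * writes each bucket through insert or merge handles, updates the index with the resulting
 * {@link WriteStatus}es, and completes the instant on the timeline when auto-commit applies.
 *
 * @param <T> type of the record payload
 */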
public abstract class BaseSparkCommitActionExecutor<T extends HoodieRecordPayload> extends
    BaseCommitActionExecutor<T, JavaRDD<HoodieRecord<T>>, JavaRDD<HoodieKey>, JavaRDD<WriteStatus>, HoodieWriteMetadata> {

  private static final Logger LOG = LogManager.getLogger(BaseSparkCommitActionExecutor.class);

  public BaseSparkCommitActionExecutor(HoodieEngineContext context,
                                       HoodieWriteConfig config,
                                       HoodieTable table,
                                       String instantTime,
                                       WriteOperationType operationType) {
    super(context, config, table, instantTime, operationType, Option.empty());
  }

  public BaseSparkCommitActionExecutor(HoodieEngineContext context,
                                       HoodieWriteConfig config,
                                       HoodieTable table,
                                       String instantTime,
                                       WriteOperationType operationType,
                                       Option<Map<String, String>> extraMetadata) {
    super(context, config, table, instantTime, operationType, extraMetadata);
  }

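  /**
   * Runs the write: persists the input RDD if it is not already cached, optionally builds a
   * {@link WorkloadProfile} and saves it to the inflight instant, partitions the records with the
   * insert/upsert partitioner, writes each Spark partition, and finally updates the index and
   * commits if auto-commit is enabled.
   */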
  @Override
  public HoodieWriteMetadata<JavaRDD<WriteStatus>> execute(JavaRDD<HoodieRecord<T>> inputRecordsRDD) {
    HoodieWriteMetadata<JavaRDD<WriteStatus>> result = new HoodieWriteMetadata<>();
    // Cache the tagged records, so we don't end up recomputing them for both profiling and writing
    // TODO: Consistent contract in HoodieWriteClient regarding preppedRecord storage level handling
    if (inputRecordsRDD.getStorageLevel() == StorageLevel.NONE()) {
      inputRecordsRDD.persist(StorageLevel.MEMORY_AND_DISK_SER());
    } else {
      LOG.info("RDD PreppedRecords was persisted at: " + inputRecordsRDD.getStorageLevel());
    }

    WorkloadProfile profile = null;
    if (isWorkloadProfileNeeded()) {
      profile = new WorkloadProfile(buildProfile(inputRecordsRDD));
      LOG.info("Workload profile: " + profile);
      saveWorkloadProfileMetadataToInflight(profile, instantTime);
    }

    // partition using the insert partitioner
    final Partitioner partitioner = getPartitioner(profile);
    JavaRDD<HoodieRecord<T>> partitionedRecords = partition(inputRecordsRDD, partitioner);
    JavaRDD<WriteStatus> writeStatusRDD = partitionedRecords.mapPartitionsWithIndex((partition, recordItr) -> {
      if (WriteOperationType.isChangingRecords(operationType)) {
        return handleUpsertPartition(instantTime, partition, recordItr, partitioner);
      } else {
        return handleInsertPartition(instantTime, partition, recordItr, partitioner);
      }
    }, true).flatMap(List::iterator);

    updateIndexAndCommitIfNeeded(writeStatusRDD, result);
    return result;
  }

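  /**
   * Builds per-partition-path and global {@link WorkloadStat}s by counting records grouped by
   * (partitionPath, currentLocation). Records that already carry a location are counted as updates
   * against that file group; records without a location are counted as inserts.
   */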
  private Pair<HashMap<String, WorkloadStat>, WorkloadStat> buildProfile(JavaRDD<HoodieRecord<T>> inputRecordsRDD) {
    HashMap<String, WorkloadStat> partitionPathStatMap = new HashMap<>();
    WorkloadStat globalStat = new WorkloadStat();

    // group the records by partitionPath + currentLocation combination, count the number of
    // records in each partition
    Map<Tuple2<String, Option<HoodieRecordLocation>>, Long> partitionLocationCounts = inputRecordsRDD
        .mapToPair(record -> new Tuple2<>(
            new Tuple2<>(record.getPartitionPath(), Option.ofNullable(record.getCurrentLocation())), record))
        .countByKey();

    // count the number of both inserts and updates in each partition, update the counts to workLoadStats
    for (Map.Entry<Tuple2<String, Option<HoodieRecordLocation>>, Long> e : partitionLocationCounts.entrySet()) {
      String partitionPath = e.getKey()._1();
      Long count = e.getValue();
      Option<HoodieRecordLocation> locOption = e.getKey()._2();

      if (!partitionPathStatMap.containsKey(partitionPath)) {
        partitionPathStatMap.put(partitionPath, new WorkloadStat());
      }

      if (locOption.isPresent()) {
        // update
        partitionPathStatMap.get(partitionPath).addUpdates(locOption.get(), count);
        globalStat.addUpdates(locOption.get(), count);
      } else {
        // insert
        partitionPathStatMap.get(partitionPath).addInserts(count);
        globalStat.addInserts(count);
      }
    }
    return Pair.of(partitionPathStatMap, globalStat);
  }

  protected Partitioner getPartitioner(WorkloadProfile profile) {
    if (WriteOperationType.isChangingRecords(operationType)) {
      return getUpsertPartitioner(profile);
    } else {
      return getInsertPartitioner(profile);
    }
  }

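  /**
   * Redistributes the deduped records using the supplied partitioner, keyed by
   * (HoodieKey, currentLocation). For tables that require sorted records, partitioning and an
   * in-partition sort by record key are done in a single shuffle.
   */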
  private JavaRDD<HoodieRecord<T>> partition(JavaRDD<HoodieRecord<T>> dedupedRecords, Partitioner partitioner) {
    JavaPairRDD<Tuple2, HoodieRecord<T>> mappedRDD = dedupedRecords.mapToPair(
        record -> new Tuple2<>(new Tuple2<>(record.getKey(), Option.ofNullable(record.getCurrentLocation())), record));

    JavaPairRDD<Tuple2, HoodieRecord<T>> partitionedRDD;
    if (table.requireSortedRecords()) {
      // Partition and sort within each partition as a single step. This is faster than partitioning first and then
      // applying a sort.
      Comparator<Tuple2> comparator = (Comparator<Tuple2> & Serializable) (t1, t2) -> {
        HoodieKey key1 = (HoodieKey) t1._1;
        HoodieKey key2 = (HoodieKey) t2._1;
        return key1.getRecordKey().compareTo(key2.getRecordKey());
      };

      partitionedRDD = mappedRDD.repartitionAndSortWithinPartitions(partitioner, comparator);
    } else {
      // Partition only
      partitionedRDD = mappedRDD.partitionBy(partitioner);
    }
    return partitionedRDD.map(Tuple2::_2);
  }

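  /**
   * Persists the write statuses, pushes the new record locations back into the index, records the
   * index update duration and replaced file ids on the result, and then commits if auto-commit is
   * enabled.
   */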
  protected void updateIndexAndCommitIfNeeded(JavaRDD<WriteStatus> writeStatusRDD, HoodieWriteMetadata result) {
    // cache writeStatusRDD before updating index, so that all actions before this are not triggered again for future
    // RDD actions that are performed after updating the index.
    writeStatusRDD = writeStatusRDD.persist(SparkMemoryUtils.getWriteStatusStorageLevel(config.getProps()));
    Instant indexStartTime = Instant.now();
    // Update the index back
    JavaRDD<WriteStatus> statuses = table.getIndex().updateLocation(writeStatusRDD, context, table);
    result.setIndexUpdateDuration(Duration.between(indexStartTime, Instant.now()));
    result.setWriteStatuses(statuses);
    result.setPartitionToReplaceFileIds(getPartitionToReplacedFileIds(statuses));
    commitOnAutoCommit(result);
  }

  protected String getCommitActionType() {
    return table.getMetaClient().getCommitActionType();
  }

  @Override
  protected void commit(Option<Map<String, String>> extraMetadata, HoodieWriteMetadata<JavaRDD<WriteStatus>> result) {
    commit(extraMetadata, result, result.getWriteStatuses().map(WriteStatus::getStat).collect());
  }

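  /**
   * Finalizes the write, builds the {@link HoodieCommitMetadata} (including any replaced file ids
   * and extra metadata), and transitions the inflight instant to completed on the active timeline.
   */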
  protected void commit(Option<Map<String, String>> extraMetadata, HoodieWriteMetadata<JavaRDD<WriteStatus>> result, List<HoodieWriteStat> writeStats) {
    String actionType = getCommitActionType();
    LOG.info("Committing " + instantTime + ", action Type " + actionType);
    result.setCommitted(true);
    result.setWriteStats(writeStats);

    // Finalize write
    finalizeWrite(instantTime, writeStats, result);

    try {
      HoodieActiveTimeline activeTimeline = table.getActiveTimeline();
      HoodieCommitMetadata metadata = CommitUtils.buildMetadata(writeStats, result.getPartitionToReplaceFileIds(),
          extraMetadata, operationType, getSchemaToStoreInCommit(), getCommitActionType());

      activeTimeline.saveAsComplete(new HoodieInstant(true, getCommitActionType(), instantTime),
          Option.of(metadata.toJsonString().getBytes(StandardCharsets.UTF_8)));
      LOG.info("Committed " + instantTime);
      result.setCommitMetadata(Option.of(metadata));
    } catch (IOException e) {
      throw new HoodieCommitException("Failed to complete commit " + config.getBasePath() + " at time " + instantTime,
          e);
    }
  }

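  /**
   * File ids replaced by this action, keyed by partition path. Nothing is replaced by default;
   * executors for replacing operations (e.g. insert overwrite) are expected to override this.
   */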
  protected Map<String, List<String>> getPartitionToReplacedFileIds(JavaRDD<WriteStatus> writeStatuses) {
    return Collections.emptyMap();
  }

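  /**
   * Writes one Spark partition by looking up its bucket in the {@link UpsertPartitioner} and
   * delegating to insert or update handling based on the bucket type.
   */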
  @SuppressWarnings("unchecked")
  protected Iterator<List<WriteStatus>> handleUpsertPartition(String instantTime, Integer partition, Iterator recordItr,
                                                              Partitioner partitioner) {
    UpsertPartitioner upsertPartitioner = (UpsertPartitioner) partitioner;
    BucketInfo binfo = upsertPartitioner.getBucketInfo(partition);
    BucketType btype = binfo.bucketType;
    try {
      if (btype.equals(BucketType.INSERT)) {
        return handleInsert(binfo.fileIdPrefix, recordItr);
      } else if (btype.equals(BucketType.UPDATE)) {
        return handleUpdate(binfo.partitionPath, binfo.fileIdPrefix, recordItr);
      } else {
        throw new HoodieUpsertException("Unknown bucketType " + btype + " for partition :" + partition);
      }
    } catch (Throwable t) {
      String msg = "Error upserting bucketType " + btype + " for partition :" + partition;
      LOG.error(msg, t);
      throw new HoodieUpsertException(msg, t);
    }
  }

  protected Iterator<List<WriteStatus>> handleInsertPartition(String instantTime, Integer partition, Iterator recordItr,
                                                              Partitioner partitioner) {
    return handleUpsertPartition(instantTime, partition, recordItr, partitioner);
  }

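  /**
   * Handles updates against a single file group. Buckets that ended up with no records yield an
   * empty write-status list.
   */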
  @Override
  public Iterator<List<WriteStatus>> handleUpdate(String partitionPath, String fileId,
                                                  Iterator<HoodieRecord<T>> recordItr)
      throws IOException {
    // This is needed since sometimes some buckets are never picked in getPartition() and end up with 0 records
    if (!recordItr.hasNext()) {
      LOG.info("Empty partition with fileId => " + fileId);
      return Collections.singletonList((List<WriteStatus>) Collections.EMPTY_LIST).iterator();
    }
    // these are updates
    HoodieMergeHandle upsertHandle = getUpdateHandle(partitionPath, fileId, recordItr);
    return handleUpdateInternal(upsertHandle, fileId);
  }

  public Iterator<List<WriteStatus>> handleUpdate(String partitionPath, String fileId,
                                                  Map<String, HoodieRecord<T>> keyToNewRecords,
                                                  HoodieBaseFile oldDataFile) throws IOException {
    // these are updates
    HoodieMergeHandle upsertHandle = getUpdateHandle(partitionPath, fileId, keyToNewRecords, oldDataFile);
    return handleUpdateInternal(upsertHandle, fileId);
  }

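  /**
   * Runs the actual merge of incoming records with the existing base file through
   * {@link SparkMergeHelper} and returns the handle's write status.
   */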
  protected Iterator<List<WriteStatus>> handleUpdateInternal(HoodieMergeHandle upsertHandle, String fileId)
      throws IOException {
    if (upsertHandle.getOldFilePath() == null) {
      throw new HoodieUpsertException(
          "Error in finding the old file path at commit " + instantTime + " for fileId: " + fileId);
    } else {
      SparkMergeHelper.newInstance().runMerge(table, upsertHandle);
    }

    // TODO(vc): This needs to be revisited
    if (upsertHandle.getWriteStatus().getPartitionPath() == null) {
      LOG.info("Upsert Handle has partition path as null " + upsertHandle.getOldFilePath() + ", "
          + upsertHandle.getWriteStatus());
    }
    return Collections.singletonList(Collections.singletonList(upsertHandle.getWriteStatus())).iterator();
  }

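  /**
   * Creates the merge handle for an update bucket: a {@link HoodieSortedMergeHandle} when the
   * table requires sorted records, otherwise a plain {@link HoodieMergeHandle}.
   */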
  protected HoodieMergeHandle getUpdateHandle(String partitionPath, String fileId, Iterator<HoodieRecord<T>> recordItr) {
    if (table.requireSortedRecords()) {
      return new HoodieSortedMergeHandle<>(config, instantTime, (HoodieSparkTable) table, recordItr, partitionPath, fileId, taskContextSupplier);
    } else {
      return new HoodieMergeHandle<>(config, instantTime, table, recordItr, partitionPath, fileId, taskContextSupplier);
    }
  }

  protected HoodieMergeHandle getUpdateHandle(String partitionPath, String fileId,
                                              Map<String, HoodieRecord<T>> keyToNewRecords,
                                              HoodieBaseFile dataFileToBeMerged) {
    return new HoodieMergeHandle<>(config, instantTime, table, keyToNewRecords,
        partitionPath, fileId, dataFileToBeMerged, taskContextSupplier);
  }

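  /**
   * Handles inserts for a bucket by lazily writing new files (prefixed with the given file id)
   * through {@link SparkLazyInsertIterable}; empty buckets yield an empty write-status list.
   */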
  @Override
  public Iterator<List<WriteStatus>> handleInsert(String idPfx, Iterator<HoodieRecord<T>> recordItr)
      throws Exception {
    // This is needed since sometimes some buckets are never picked in getPartition() and end up with 0 records
    if (!recordItr.hasNext()) {
      LOG.info("Empty partition");
      return Collections.singletonList((List<WriteStatus>) Collections.EMPTY_LIST).iterator();
    }
    return new SparkLazyInsertIterable(recordItr, true, config, instantTime, table, idPfx,
        taskContextSupplier, new CreateHandleFactory<>());
  }

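  /**
   * Builds the {@link UpsertPartitioner} that maps records to buckets; a workload profile is
   * required to construct it.
   */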
  public Partitioner getUpsertPartitioner(WorkloadProfile profile) {
    if (profile == null) {
      throw new HoodieUpsertException("Need workload profile to construct the upsert partitioner.");
    }
    return new UpsertPartitioner(profile, context, table, config);
  }

  public Partitioner getInsertPartitioner(WorkloadProfile profile) {
    return getUpsertPartitioner(profile);
  }
}