| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| |
| package org.apache.iotdb.db.pipe.event.common.tsfile; |
| |
| import org.apache.iotdb.commons.pipe.config.PipeConfig; |
| import org.apache.iotdb.commons.pipe.event.EnrichedEvent; |
| import org.apache.iotdb.commons.pipe.pattern.PipePattern; |
| import org.apache.iotdb.commons.pipe.task.meta.PipeTaskMeta; |
| import org.apache.iotdb.db.pipe.event.common.tablet.PipeRawTabletInsertionEvent; |
| import org.apache.iotdb.db.pipe.resource.PipeResourceManager; |
| import org.apache.iotdb.db.pipe.resource.memory.PipeMemoryBlock; |
| import org.apache.iotdb.db.pipe.resource.memory.PipeMemoryWeighUtil; |
| import org.apache.iotdb.db.pipe.resource.tsfile.PipeTsFileResourceManager; |
| import org.apache.iotdb.pipe.api.event.dml.insertion.TabletInsertionEvent; |
| import org.apache.iotdb.pipe.api.exception.PipeException; |
| |
| import org.apache.tsfile.enums.TSDataType; |
| import org.apache.tsfile.file.metadata.IDeviceID; |
| import org.apache.tsfile.file.metadata.PlainDeviceID; |
| import org.apache.tsfile.read.TsFileDeviceIterator; |
| import org.apache.tsfile.read.TsFileReader; |
| import org.apache.tsfile.read.TsFileSequenceReader; |
| import org.apache.tsfile.read.expression.IExpression; |
| import org.apache.tsfile.read.expression.impl.BinaryExpression; |
| import org.apache.tsfile.read.expression.impl.GlobalTimeExpression; |
| import org.apache.tsfile.read.filter.factory.TimeFilterApi; |
| import org.apache.tsfile.utils.Pair; |
| import org.apache.tsfile.write.record.Tablet; |
| import org.slf4j.Logger; |
| import org.slf4j.LoggerFactory; |
| |
| import java.io.File; |
| import java.io.IOException; |
| import java.util.ArrayList; |
| import java.util.HashMap; |
| import java.util.Iterator; |
| import java.util.List; |
| import java.util.Map; |
| import java.util.NoSuchElementException; |
| import java.util.Objects; |
| |
| public class TsFileInsertionDataContainer implements AutoCloseable { |
| |
| private static final Logger LOGGER = LoggerFactory.getLogger(TsFileInsertionDataContainer.class); |
| |
| private final PipePattern pattern; // used to filter data |
| private final IExpression timeFilterExpression; // used to filter data |
| |
| private final PipeTaskMeta pipeTaskMeta; // used to report progress |
| private final EnrichedEvent sourceEvent; // used to report progress |
| |
| private final PipeMemoryBlock allocatedMemoryBlock; |
| |
| private final TsFileSequenceReader tsFileSequenceReader; |
| private final TsFileReader tsFileReader; |
| |
| private final Iterator<Map.Entry<IDeviceID, List<String>>> deviceMeasurementsMapIterator; |
| private final Map<IDeviceID, Boolean> deviceIsAlignedMap; |
| private final Map<String, TSDataType> measurementDataTypeMap; |
| |
| private boolean shouldParsePattern = false; |
| |
| public TsFileInsertionDataContainer( |
| File tsFile, PipePattern pattern, long startTime, long endTime) throws IOException { |
| this(tsFile, pattern, startTime, endTime, null, null); |
| } |
| |
| public TsFileInsertionDataContainer( |
| File tsFile, |
| PipePattern pattern, |
| long startTime, |
| long endTime, |
| PipeTaskMeta pipeTaskMeta, |
| EnrichedEvent sourceEvent) |
| throws IOException { |
| this.pattern = pattern; |
| timeFilterExpression = |
| (startTime == Long.MIN_VALUE && endTime == Long.MAX_VALUE) |
| ? null |
| : BinaryExpression.and( |
| new GlobalTimeExpression(TimeFilterApi.gtEq(startTime)), |
| new GlobalTimeExpression(TimeFilterApi.ltEq(endTime))); |
| |
| this.pipeTaskMeta = pipeTaskMeta; |
| this.sourceEvent = sourceEvent; |
| |
| try { |
| final PipeTsFileResourceManager tsFileResourceManager = PipeResourceManager.tsfile(); |
| final Map<IDeviceID, List<String>> deviceMeasurementsMap; |
| |
| // TsFileReader is not thread-safe, so we need to create it here and close it later. |
| long memoryRequiredInBytes = |
| PipeConfig.getInstance().getPipeMemoryAllocateForTsFileSequenceReaderInBytes(); |
| tsFileSequenceReader = new TsFileSequenceReader(tsFile.getPath(), true, true); |
| tsFileReader = new TsFileReader(tsFileSequenceReader); |
| |
| if (tsFileResourceManager.cacheObjectsIfAbsent(tsFile)) { |
| // These read-only objects can be found in cache. |
| deviceIsAlignedMap = tsFileResourceManager.getDeviceIsAlignedMapFromCache(tsFile); |
| measurementDataTypeMap = tsFileResourceManager.getMeasurementDataTypeMapFromCache(tsFile); |
| deviceMeasurementsMap = tsFileResourceManager.getDeviceMeasurementsMapFromCache(tsFile); |
| } else { |
| // We need to create these objects here and remove them later. |
| deviceIsAlignedMap = readDeviceIsAlignedMap(); |
| memoryRequiredInBytes += PipeMemoryWeighUtil.memoryOfIDeviceId2Bool(deviceIsAlignedMap); |
| |
| measurementDataTypeMap = tsFileSequenceReader.getFullPathDataTypeMap(); |
| memoryRequiredInBytes += PipeMemoryWeighUtil.memoryOfStr2TSDataType(measurementDataTypeMap); |
| |
| deviceMeasurementsMap = tsFileSequenceReader.getDeviceMeasurementsMap(); |
| memoryRequiredInBytes += |
| PipeMemoryWeighUtil.memoryOfIDeviceID2StrList(deviceMeasurementsMap); |
| } |
| allocatedMemoryBlock = PipeResourceManager.memory().forceAllocate(memoryRequiredInBytes); |
| |
| deviceMeasurementsMapIterator = |
| filterDeviceMeasurementsMapByPattern(deviceMeasurementsMap).entrySet().iterator(); |
| |
| // No longer need this. Help GC. |
| tsFileSequenceReader.clearCachedDeviceMetadata(); |
| } catch (Exception e) { |
| close(); |
| throw e; |
| } |
| } |
| |
| private Map<IDeviceID, List<String>> filterDeviceMeasurementsMapByPattern( |
| Map<IDeviceID, List<String>> originalDeviceMeasurementsMap) { |
| final Map<IDeviceID, List<String>> filteredDeviceMeasurementsMap = new HashMap<>(); |
| for (Map.Entry<IDeviceID, List<String>> entry : originalDeviceMeasurementsMap.entrySet()) { |
| final String deviceId = ((PlainDeviceID) entry.getKey()).toStringID(); |
| |
| // case 1: for example, pattern is root.a.b or pattern is null and device is root.a.b.c |
| // in this case, all data can be matched without checking the measurements |
| if (Objects.isNull(pattern) || pattern.isRoot() || pattern.coversDevice(deviceId)) { |
| if (!entry.getValue().isEmpty()) { |
| filteredDeviceMeasurementsMap.put(new PlainDeviceID(deviceId), entry.getValue()); |
| } |
| } |
| |
| // case 2: for example, pattern is root.a.b.c and device is root.a.b |
| // in this case, we need to check the full path |
| else if (pattern.mayOverlapWithDevice(deviceId)) { |
| final List<String> filteredMeasurements = new ArrayList<>(); |
| |
| for (final String measurement : entry.getValue()) { |
| if (pattern.matchesMeasurement(deviceId, measurement)) { |
| filteredMeasurements.add(measurement); |
| } else { |
| // Parse pattern iff there are measurements filtered out |
| shouldParsePattern = true; |
| } |
| } |
| |
| if (!filteredMeasurements.isEmpty()) { |
| filteredDeviceMeasurementsMap.put(new PlainDeviceID(deviceId), filteredMeasurements); |
| } |
| } |
| |
| // case 3: for example, pattern is root.a.b.c and device is root.a.b.d |
| // in this case, no data can be matched |
| else { |
| // Parse pattern iff there are measurements filtered out |
| shouldParsePattern = true; |
| } |
| } |
| |
| return filteredDeviceMeasurementsMap; |
| } |
| |
| private Map<IDeviceID, Boolean> readDeviceIsAlignedMap() throws IOException { |
| final Map<IDeviceID, Boolean> deviceIsAlignedResultMap = new HashMap<>(); |
| final TsFileDeviceIterator deviceIsAlignedIterator = |
| tsFileSequenceReader.getAllDevicesIteratorWithIsAligned(); |
| while (deviceIsAlignedIterator.hasNext()) { |
| final Pair<IDeviceID, Boolean> deviceIsAlignedPair = deviceIsAlignedIterator.next(); |
| deviceIsAlignedResultMap.put(deviceIsAlignedPair.getLeft(), deviceIsAlignedPair.getRight()); |
| } |
| return deviceIsAlignedResultMap; |
| } |
| |
| /** @return {@link TabletInsertionEvent} in a streaming way */ |
| public Iterable<TabletInsertionEvent> toTabletInsertionEvents() { |
| return () -> |
| new Iterator<TabletInsertionEvent>() { |
| |
| private TsFileInsertionDataTabletIterator tabletIterator = null; |
| |
| @Override |
| public boolean hasNext() { |
| while (tabletIterator == null || !tabletIterator.hasNext()) { |
| if (!deviceMeasurementsMapIterator.hasNext()) { |
| close(); |
| return false; |
| } |
| |
| final Map.Entry<IDeviceID, List<String>> entry = deviceMeasurementsMapIterator.next(); |
| |
| try { |
| tabletIterator = |
| new TsFileInsertionDataTabletIterator( |
| tsFileReader, |
| measurementDataTypeMap, |
| ((PlainDeviceID) entry.getKey()).toStringID(), |
| entry.getValue(), |
| timeFilterExpression); |
| } catch (IOException e) { |
| close(); |
| throw new PipeException("failed to create TsFileInsertionDataTabletIterator", e); |
| } |
| } |
| |
| return true; |
| } |
| |
| @Override |
| public TabletInsertionEvent next() { |
| if (!hasNext()) { |
| close(); |
| throw new NoSuchElementException(); |
| } |
| |
| final Tablet tablet = tabletIterator.next(); |
| final boolean isAligned = |
| deviceIsAlignedMap.getOrDefault(new PlainDeviceID(tablet.deviceId), false); |
| |
| final TabletInsertionEvent next; |
| if (!hasNext()) { |
| next = |
| new PipeRawTabletInsertionEvent( |
| tablet, |
| isAligned, |
| sourceEvent != null ? sourceEvent.getPipeName() : null, |
| pipeTaskMeta, |
| sourceEvent, |
| true); |
| close(); |
| } else { |
| next = |
| new PipeRawTabletInsertionEvent( |
| tablet, |
| isAligned, |
| sourceEvent != null ? sourceEvent.getPipeName() : null, |
| pipeTaskMeta, |
| sourceEvent, |
| false); |
| } |
| return next; |
| } |
| }; |
| } |
| |
| public boolean shouldParsePattern() { |
| return shouldParsePattern; |
| } |
| |
| @Override |
| public void close() { |
| try { |
| if (tsFileReader != null) { |
| tsFileReader.close(); |
| } |
| } catch (IOException e) { |
| LOGGER.warn("Failed to close TsFileReader", e); |
| } |
| |
| try { |
| if (tsFileSequenceReader != null) { |
| tsFileSequenceReader.close(); |
| } |
| } catch (IOException e) { |
| LOGGER.warn("Failed to close TsFileSequenceReader", e); |
| } |
| |
| if (allocatedMemoryBlock != null) { |
| allocatedMemoryBlock.close(); |
| } |
| } |
| } |