blob: f6de3f8490a560c5843639c9b77c5b80f7518e05 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more contributor license
* agreements. See the NOTICE file distributed with this work for additional information regarding
* copyright ownership. The ASF licenses this file to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance with the License. You may obtain a
* copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software distributed under the License
* is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
* or implied. See the License for the specific language governing permissions and limitations under
* the License.
*/
package org.apache.fluo.accumulo.iterators;
import java.io.IOException;
import java.util.Collection;
import java.util.Map;
import org.apache.accumulo.core.client.IteratorSetting;
import org.apache.accumulo.core.data.ByteSequence;
import org.apache.accumulo.core.data.Key;
import org.apache.accumulo.core.data.PartialKey;
import org.apache.accumulo.core.data.Range;
import org.apache.accumulo.core.data.Value;
import org.apache.accumulo.core.iterators.IteratorEnvironment;
import org.apache.accumulo.core.iterators.SortedKeyValueIterator;
import org.apache.fluo.accumulo.util.ColumnConstants;
import org.apache.fluo.accumulo.util.ColumnType;
import org.apache.fluo.accumulo.util.ReadLockUtil;
import org.apache.fluo.accumulo.values.DelReadLockValue;
import org.apache.fluo.accumulo.values.WriteValue;
/**
*
*/
public class PrewriteIterator implements SortedKeyValueIterator<Key, Value> {
private static final String TIMESTAMP_OPT = "timestampOpt";
private static final String CHECK_ACK_OPT = "checkAckOpt";
private static final String NTFY_TIMESTAMP_OPT = "ntfyTsOpt";
private static final String READ_LOCK_OPT = "readLock";
private TimestampSkippingIterator source;
private long snaptime;
boolean hasTop = false;
boolean checkAck = false;
long ntfyTimestamp = -1;
boolean readlock;
public static void setSnaptime(IteratorSetting cfg, long time) {
if (time < 0 || (ColumnConstants.PREFIX_MASK & time) != 0) {
throw new IllegalArgumentException();
}
cfg.addOption(TIMESTAMP_OPT, time + "");
}
public static void setReadlock(IteratorSetting cfg) {
cfg.addOption(READ_LOCK_OPT, Boolean.TRUE.toString());
}
public static void enableAckCheck(IteratorSetting cfg, long timestamp) {
cfg.addOption(CHECK_ACK_OPT, Boolean.TRUE.toString());
cfg.addOption(NTFY_TIMESTAMP_OPT, timestamp + "");
}
@Override
public void init(SortedKeyValueIterator<Key, Value> source, Map<String, String> options,
IteratorEnvironment env) throws IOException {
this.source = new TimestampSkippingIterator(source);
this.snaptime = Long.parseLong(options.get(TIMESTAMP_OPT));
if (options.containsKey(CHECK_ACK_OPT)) {
this.checkAck = Boolean.parseBoolean(options.get(CHECK_ACK_OPT));
this.ntfyTimestamp = Long.parseLong(options.get(NTFY_TIMESTAMP_OPT));
}
this.readlock = Boolean.parseBoolean(options.getOrDefault(READ_LOCK_OPT, "false"));
}
@Override
public boolean hasTop() {
return hasTop && source.hasTop();
}
@Override
public void next() throws IOException {
hasTop = false;
}
@Override
public void seek(Range range, Collection<ByteSequence> columnFamilies, boolean inclusive)
throws IOException {
Collection<ByteSequence> fams;
if (columnFamilies.isEmpty() && !inclusive) {
fams = SnapshotIterator.NOTIFY_CF_SET;
inclusive = false;
} else {
fams = columnFamilies;
}
Key endKey = new Key(range.getStartKey());
if (checkAck) {
endKey.setTimestamp(ColumnType.DATA.first());
} else {
endKey.setTimestamp(ColumnType.ACK.first());
}
// Tried seeking directly to WRITE_PREFIX, however this did not work well because of how
// TimestampSkippingIterator currently works. Currently, it can not remove the deleting iterator
// until after the first seek.
Range seekRange = new Range(range.getStartKey(), true, endKey, false);
source.seek(seekRange, fams, inclusive);
hasTop = false;
long invalidationTime = -1;
while (source.hasTop() && seekRange.getStartKey().equals(source.getTopKey(),
PartialKey.ROW_COLFAM_COLQUAL_COLVIS)) {
ColumnType colType = ColumnType.from(source.getTopKey());
long ts = source.getTopKey().getTimestamp() & ColumnConstants.TIMESTAMP_MASK;
switch (colType) {
case TX_DONE: {
// tried to make 1st seek go to WRITE_PREFIX, but this did not allow the DeleteIterator to
// be removed from the stack so it was slower.
source.skipToPrefix(seekRange.getStartKey(), ColumnType.WRITE);
break;
}
case WRITE: {
long timePtr = WriteValue.getTimestamp(source.getTopValue().get());
if (timePtr > invalidationTime) {
invalidationTime = timePtr;
}
if (ts >= snaptime) {
hasTop = true;
return;
}
source.skipToPrefix(seekRange.getStartKey(), ColumnType.DEL_LOCK);
break;
}
case DEL_LOCK: {
if (ts > invalidationTime) {
invalidationTime = ts;
if (ts >= snaptime) {
hasTop = true;
return;
}
}
if (readlock) {
source.skipToPrefix(seekRange.getStartKey(), ColumnType.LOCK);
} else {
source.skipToPrefix(seekRange.getStartKey(), ColumnType.RLOCK);
}
break;
}
case RLOCK: {
long lastDeleteTs = -1;
long rlts = ReadLockUtil.decodeTs(ts);
if (!readlock) {
while (rlts > invalidationTime && colType == ColumnType.RLOCK) {
if (ReadLockUtil.isDelete(ts)) {
// ignore rolled back read locks, these should never prevent a write lock
if (!DelReadLockValue.isRollback(source.getTopValue().get())) {
if (rlts >= snaptime) {
hasTop = true;
return;
} else {
long rlockCommitTs =
DelReadLockValue.getCommitTimestamp(source.getTopValue().get());
if (rlockCommitTs > snaptime) {
hasTop = true;
return;
}
}
}
lastDeleteTs = rlts;
} else {
if (rlts != lastDeleteTs) {
// this read lock is active
hasTop = true;
return;
}
}
source.next();
if (source.hasTop()) {
colType = ColumnType.from(source.getTopKey());
ts = source.getTopKey().getTimestamp() & ColumnConstants.TIMESTAMP_MASK;
rlts = ReadLockUtil.decodeTs(ts);
} else {
break;
}
}
}
if (source.hasTop() && (colType == ColumnType.RLOCK)) {
source.skipToPrefix(seekRange.getStartKey(), ColumnType.LOCK);
}
break;
}
case LOCK: {
if (ts > invalidationTime) {
// nothing supersedes this lock, therefore the column is locked
hasTop = true;
return;
}
if (checkAck) {
source.skipToPrefix(seekRange.getStartKey(), ColumnType.ACK);
} else {
// only ack and data left and not interested in either so stop looking
return;
}
break;
}
case DATA: {
// can stop looking
return;
}
case ACK: {
if (checkAck && ts > ntfyTimestamp) {
hasTop = true;
return;
} else {
// nothing else to look at in this column
return;
}
}
default:
throw new IllegalArgumentException();
}
}
}
@Override
public Key getTopKey() {
return source.getTopKey();
}
@Override
public Value getTopValue() {
return source.getTopValue();
}
@Override
public SortedKeyValueIterator<Key, Value> deepCopy(IteratorEnvironment env) {
// TODO Auto-generated method stub
return null;
}
}