/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.cassandra.db.transform;

import org.apache.cassandra.config.CFMetaData;
import org.apache.cassandra.db.Clustering;
import org.apache.cassandra.db.DeletionTime;
import org.apache.cassandra.db.ReadExecutionController;
import org.apache.cassandra.db.partitions.UnfilteredPartitionIterator;
import org.apache.cassandra.db.rows.*;

A transformation that appends an RT bound marker to row iterators in case they don't have one. This used to happen, for example, in ReadCommand.executeLocally(ReadExecutionController) if DataLimits stopped the iterator on a live row that was enclosed in an older RT. If we don't do this, and send a response without the closing bound, we can break read/short read protection read isolation, and potentially cause data loss. See CASSANDRA-14515 for context.
/** * A transformation that appends an RT bound marker to row iterators in case they don't have one. * * This used to happen, for example, in {@link org.apache.cassandra.db.ReadCommand#executeLocally(ReadExecutionController)} * if {@link org.apache.cassandra.db.filter.DataLimits} stopped the iterator on a live row that was enclosed in an * older RT. * * If we don't do this, and send a response without the closing bound, we can break read/short read protection read * isolation, and potentially cause data loss. * * See CASSANDRA-14515 for context. */
public final class RTBoundCloser extends Transformation<UnfilteredRowIterator> { private RTBoundCloser() { } public static UnfilteredPartitionIterator close(UnfilteredPartitionIterator partitions) { return Transformation.apply(partitions, new RTBoundCloser()); } public static UnfilteredRowIterator close(UnfilteredRowIterator partition) { RowsTransformation transformation = new RowsTransformation(partition); return Transformation.apply(MoreRows.extend(partition, transformation, partition.columns()), transformation); } @Override public UnfilteredRowIterator applyToPartition(UnfilteredRowIterator partition) { RowsTransformation transformation = new RowsTransformation(partition); return Transformation.apply(MoreRows.extend(partition, transformation, partition.columns()), transformation); } private final static class RowsTransformation extends Transformation implements MoreRows<UnfilteredRowIterator> { private final UnfilteredRowIterator partition; private Clustering lastRowClustering; private DeletionTime openMarkerDeletionTime; private RowsTransformation(UnfilteredRowIterator partition) { this.partition = partition; } @Override public Row applyToRow(Row row) { lastRowClustering = row.clustering(); return row; } @Override public RangeTombstoneMarker applyToMarker(RangeTombstoneMarker marker) { openMarkerDeletionTime = marker.isOpen(partition.isReverseOrder()) ? marker.openDeletionTime(partition.isReverseOrder()) : null; lastRowClustering = null; return marker; } @Override public UnfilteredRowIterator moreContents() { // there is no open RT in the stream - nothing for us to do if (null == openMarkerDeletionTime) return null; /* * there *is* an open RT in the stream, but there have been no rows after the opening bound - this must * never happen in scenarios where RTBoundCloser is meant to be used; the last encountered clustering * should be either a closing bound marker - if the iterator was exhausted fully - or a live row - if * DataLimits stopped it short in the middle of an RT. */ if (null == lastRowClustering) { CFMetaData metadata = partition.metadata(); String message = String.format("UnfilteredRowIterator for %s.%s has an open RT bound as its last item", metadata.ksName, metadata.cfName); throw new IllegalStateException(message); } // create an artificial inclusive closing RT bound with bound matching last seen row's clustering RangeTombstoneBoundMarker closingBound = RangeTombstoneBoundMarker.inclusiveClose(partition.isReverseOrder(), lastRowClustering.getRawValues(), openMarkerDeletionTime); return UnfilteredRowIterators.singleton(closingBound, partition.metadata(), partition.partitionKey(), partition.partitionLevelDeletion(), partition.columns(), partition.staticRow(), partition.isReverseOrder(), partition.stats()); } } }