/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.lucene.util.packed;


import java.io.IOException;
import java.util.Arrays;

import org.apache.lucene.store.IndexInput;
import org.apache.lucene.store.RandomAccessInput;
import org.apache.lucene.util.Accountable;
import org.apache.lucene.util.LongValues;
import org.apache.lucene.util.RamUsageEstimator;

Retrieves an instance previously written by DirectMonotonicWriter.
See Also:
/** * Retrieves an instance previously written by {@link DirectMonotonicWriter}. * @see DirectMonotonicWriter */
public final class DirectMonotonicReader extends LongValues implements Accountable { private static final long BASE_RAM_BYTES_USED = RamUsageEstimator.shallowSizeOfInstance(DirectMonotonicReader.class);
An instance that always returns 0.
/** An instance that always returns {@code 0}. */
private static final LongValues EMPTY = new LongValues() { @Override public long get(long index) { return 0; } };
In-memory metadata that needs to be kept around for DirectMonotonicReader to read data from disk.
/** In-memory metadata that needs to be kept around for * {@link DirectMonotonicReader} to read data from disk. */
public static class Meta implements Accountable { private static final long BASE_RAM_BYTES_USED = RamUsageEstimator.shallowSizeOfInstance(Meta.class); final int blockShift; final int numBlocks; final long[] mins; final float[] avgs; final byte[] bpvs; final long[] offsets; Meta(long numValues, int blockShift) { this.blockShift = blockShift; long numBlocks = numValues >>> blockShift; if ((numBlocks << blockShift) < numValues) { numBlocks += 1; } this.numBlocks = (int) numBlocks; this.mins = new long[this.numBlocks]; this.avgs = new float[this.numBlocks]; this.bpvs = new byte[this.numBlocks]; this.offsets = new long[this.numBlocks]; } @Override public long ramBytesUsed() { return BASE_RAM_BYTES_USED + RamUsageEstimator.sizeOf(mins) + RamUsageEstimator.sizeOf(avgs) + RamUsageEstimator.sizeOf(bpvs) + RamUsageEstimator.sizeOf(offsets); } }
Load metadata from the given IndexInput. @see DirectMonotonicReader#getInstance(Meta, RandomAccessInput)
/** Load metadata from the given {@link IndexInput}. * @see DirectMonotonicReader#getInstance(Meta, RandomAccessInput) */
public static Meta loadMeta(IndexInput metaIn, long numValues, int blockShift) throws IOException { Meta meta = new Meta(numValues, blockShift); for (int i = 0; i < meta.numBlocks; ++i) { meta.mins[i] = metaIn.readLong(); meta.avgs[i] = Float.intBitsToFloat(metaIn.readInt()); meta.offsets[i] = metaIn.readLong(); meta.bpvs[i] = metaIn.readByte(); } return meta; }
Retrieves an instance from the specified slice.
/** * Retrieves an instance from the specified slice. */
public static DirectMonotonicReader getInstance(Meta meta, RandomAccessInput data) throws IOException { final LongValues[] readers = new LongValues[meta.numBlocks]; for (int i = 0; i < meta.mins.length; ++i) { if (meta.bpvs[i] == 0) { readers[i] = EMPTY; } else { readers[i] = DirectReader.getInstance(data, meta.bpvs[i], meta.offsets[i]); } } return new DirectMonotonicReader(meta.blockShift, readers, meta.mins, meta.avgs, meta.bpvs); } private final int blockShift; private final LongValues[] readers; private final long[] mins; private final float[] avgs; private final byte[] bpvs; private final int nonZeroBpvs; private DirectMonotonicReader(int blockShift, LongValues[] readers, long[] mins, float[] avgs, byte[] bpvs) { this.blockShift = blockShift; this.readers = readers; this.mins = mins; this.avgs = avgs; this.bpvs = bpvs; if (readers.length != mins.length || readers.length != avgs.length || readers.length != bpvs.length) { throw new IllegalArgumentException(); } int nonZeroBpvs = 0; for (byte b : bpvs) { if (b != 0) { nonZeroBpvs++; } } this.nonZeroBpvs = nonZeroBpvs; } @Override public long get(long index) { final int block = (int) (index >>> blockShift); final long blockIndex = index & ((1 << blockShift) - 1); final long delta = readers[block].get(blockIndex); return mins[block] + (long) (avgs[block] * blockIndex) + delta; }
Get lower/upper bounds for the value at a given index without hitting the direct reader.
/** Get lower/upper bounds for the value at a given index without hitting the direct reader. */
private long[] getBounds(long index) { final int block = Math.toIntExact(index >>> blockShift); final long blockIndex = index & ((1 << blockShift) - 1); final long lowerBound = mins[block] + (long) (avgs[block] * blockIndex); final long upperBound = lowerBound + (1L << bpvs[block]) - 1; if (bpvs[block] == 64 || upperBound < lowerBound) { // overflow return new long[] { Long.MIN_VALUE, Long.MAX_VALUE }; } else { return new long[] { lowerBound, upperBound }; } }
Return the index of a key if it exists, or its insertion point otherwise like Arrays.binarySearch(long[], int, int, long).
See Also:
/** * Return the index of a key if it exists, or its insertion point otherwise * like {@link Arrays#binarySearch(long[], int, int, long)}. * * @see Arrays#binarySearch(long[], int, int, long) */
public long binarySearch(long fromIndex, long toIndex, long key) { if (fromIndex < 0 || fromIndex > toIndex) { throw new IllegalArgumentException("fromIndex=" + fromIndex + ",toIndex=" + toIndex); } long lo = fromIndex; long hi = toIndex - 1; while (lo <= hi) { final long mid = (lo + hi) >>> 1; // Try to run as many iterations of the binary search as possible without // hitting the direct readers, since they might hit a page fault. final long[] bounds = getBounds(mid); if (bounds[1] < key) { lo = mid + 1; } else if (bounds[0] > key) { hi = mid - 1; } else { final long midVal = get(mid); if (midVal < key) { lo = mid + 1; } else if (midVal > key) { hi = mid - 1; } else { return mid; } } } return -1 - lo; } @Override public long ramBytesUsed() { // Don't include meta, which should be accounted separately return BASE_RAM_BYTES_USED + RamUsageEstimator.shallowSizeOf(readers) + // Assume empty objects for the readers nonZeroBpvs * RamUsageEstimator.alignObjectSize(RamUsageEstimator.NUM_BYTES_ARRAY_HEADER); } }